diff --git "a/perplexity25/3510097.out" "b/perplexity25/3510097.out" new file mode 100644--- /dev/null +++ "b/perplexity25/3510097.out" @@ -0,0 +1,40508 @@ +Model parameters: d_model 2560 ffw_size 10240 kv_size 128 n_heads 20 n_layers 34 +Megatron-DeepSpeed/pretrain_gpt.py --tensor-model-parallel-size 1 --pipeline-model-parallel-size 1 --num-layers 34 --hidden-size 2560 --num-attention-heads 20 --kv-channels 128 --ffn-hidden-size 10240 --seq-length 2048 --max-position-embeddings 2048 --micro-batch-size 2 --global-batch-size 512 --train-samples 1 --vocab-file gpt2/vocab.json --merge-file gpt2/merges.txt --clip-grad 1.0 --kill-switch-path kill-switch-2b855b55bc4perplexity25val --bf16 --optimizer adam --adam-beta1 0.9 --adam-beta2 0.999 --adam-eps 1e-8 --lr 2e-4 --min-lr 2e-5 --lr-decay-style cosine --lr-decay-samples 1 --lr-warmup-samples 0 --clip-grad 1.0 --weight-decay 1e-1 --override-lr-scheduler --reset-progress --no-load-optim --log-interval 10 --save-interval 1000 --eval-interval 1 --eval-iters 100 --eval-only true --tensorboard-dir tensorboard_2b855b55bc4perplexity25val --tensorboard-queue-size 5 --log-timers-to-tensorboard --log-batch-size-to-tensorboard --log-validation-ppl-to-tensorboard --save lm1-2b8-55b-c4-repetitions/perplexity25 --load lm1-2b8-55b-c4-repetitions/perplexity25 --train-weighted-split-paths-path train1b5.txt --valid-weighted-split-paths-path val.txt --data-impl mmap --deepspeed --deepspeed_config ds_configs/3510097.json --zero-stage 0 +START 3510097: Sat 13 May 2023 03:23:43 AM EEST + 0: + 0: + 0: ======================= ROCm System Management Interface ======================= + 0: ================================= Concise Info ================================= + 0: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 0: 0 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 2 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 4 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 6 37.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: ================================================================================ + 0: ============================= End of ROCm SMI Log ============================== +21: +21: +21: ======================= ROCm System Management Interface ======================= +21: ================================= Concise Info ================================= +21: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +21: 0 44.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 2 39.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 4 36.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 6 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: ================================================================================ +21: ============================= End of ROCm SMI Log ============================== +22: +22: +22: ======================= ROCm System Management Interface ======================= +22: ================================= Concise Info ================================= +22: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +22: 0 50.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 2 42.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 5 39.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 6 39.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: ================================================================================ +22: ============================= End of ROCm SMI Log ============================== +20: +20: +20: ======================= ROCm System Management Interface ======================= +20: ================================= Concise Info ================================= +20: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +20: 0 52.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 2 44.0c 100.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 4 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 6 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: ================================================================================ +20: ============================= End of ROCm SMI Log ============================== +27: +27: +27: ======================= ROCm System Management Interface ======================= +27: ================================= Concise Info ================================= +27: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +27: 0 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 2 43.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 4 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 6 37.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: ================================================================================ +27: ============================= End of ROCm SMI Log ============================== + 8: + 8: + 8: ======================= ROCm System Management Interface ======================= + 8: ================================= Concise Info ================================= + 8: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 8: 0 47.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 2 39.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 4 49.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 6 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: ================================================================================ + 8: ============================= End of ROCm SMI Log ============================== +23: +23: +23: ======================= ROCm System Management Interface ======================= +23: ================================= Concise Info ================================= +23: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +23: 0 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 2 41.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 4 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 6 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: ================================================================================ +23: ============================= End of ROCm SMI Log ============================== +24: +24: +24: ======================= ROCm System Management Interface ======================= +24: ================================= Concise Info ================================= +24: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +24: 0 48.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 2 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 3 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 4 47.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 6 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: ================================================================================ +24: ============================= End of ROCm SMI Log ============================== +13: +13: +13: ======================= ROCm System Management Interface ======================= +13: ================================= Concise Info ================================= +13: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +13: 0 43.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 2 39.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 4 43.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 6 44.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: ================================================================================ +13: ============================= End of ROCm SMI Log ============================== +30: +30: +30: ======================= ROCm System Management Interface ======================= +30: ================================= Concise Info ================================= +30: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +30: 0 45.0c 99.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 2 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 4 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 6 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: ================================================================================ +30: ============================= End of ROCm SMI Log ============================== +31: +31: +31: ======================= ROCm System Management Interface ======================= +31: ================================= Concise Info ================================= +31: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +31: 0 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 2 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 4 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 6 38.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: ================================================================================ +31: ============================= End of ROCm SMI Log ============================== +25: +25: +25: ======================= ROCm System Management Interface ======================= +25: ================================= Concise Info ================================= +25: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +25: 0 44.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 2 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 4 42.0c 167.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 6 40.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: ================================================================================ +25: ============================= End of ROCm SMI Log ============================== +17: +17: +17: ======================= ROCm System Management Interface ======================= +17: ================================= Concise Info ================================= +17: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +17: 0 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 2 38.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 4 44.0c 80.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 6 39.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: ================================================================================ +17: ============================= End of ROCm SMI Log ============================== +10: +10: +10: ======================= ROCm System Management Interface ======================= +10: ================================= Concise Info ================================= +10: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +10: 0 47.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 2 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 4 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 6 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: ================================================================================ +10: ============================= End of ROCm SMI Log ============================== +16: +16: +16: ======================= ROCm System Management Interface ======================= +16: ================================= Concise Info ================================= +16: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +16: 0 45.0c 99.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 1 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 2 41.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 4 42.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 5 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 6 36.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: ================================================================================ +16: ============================= End of ROCm SMI Log ============================== + 6: + 6: + 6: ======================= ROCm System Management Interface ======================= + 6: ================================= Concise Info ================================= + 6: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 6: 0 47.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 2 42.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 4 45.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 6 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: ================================================================================ + 6: ============================= End of ROCm SMI Log ============================== + 3: + 3: + 3: ======================= ROCm System Management Interface ======================= + 3: ================================= Concise Info ================================= + 3: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 3: 0 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 2 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 4 40.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 6 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: ================================================================================ + 3: ============================= End of ROCm SMI Log ============================== +19: +19: +19: ======================= ROCm System Management Interface ======================= +19: ================================= Concise Info ================================= +19: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +19: 0 45.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 2 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 4 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 6 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: ================================================================================ +19: ============================= End of ROCm SMI Log ============================== +14: +14: +14: ======================= ROCm System Management Interface ======================= +14: ================================= Concise Info ================================= +14: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +14: 0 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 2 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 4 44.0c 78.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 6 39.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: ================================================================================ +14: ============================= End of ROCm SMI Log ============================== +26: +26: +26: ======================= ROCm System Management Interface ======================= +26: ================================= Concise Info ================================= +26: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +26: 0 47.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 2 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 3 39.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 4 48.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 6 39.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: ================================================================================ +26: ============================= End of ROCm SMI Log ============================== + 4: + 4: + 4: ======================= ROCm System Management Interface ======================= + 4: ================================= Concise Info ================================= + 4: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 4: 0 50.0c 99.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 2 39.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 3 39.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 4 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 6 39.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: ================================================================================ + 4: ============================= End of ROCm SMI Log ============================== + 2: + 2: + 2: ======================= ROCm System Management Interface ======================= + 2: ================================= Concise Info ================================= + 2: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 2: 0 44.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 2 36.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 4 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 6 37.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: ================================================================================ + 2: ============================= End of ROCm SMI Log ============================== +18: +18: +18: ======================= ROCm System Management Interface ======================= +18: ================================= Concise Info ================================= +18: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +18: 0 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 2 37.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 4 46.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 6 36.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: ================================================================================ +18: ============================= End of ROCm SMI Log ============================== + 9: + 9: + 9: ======================= ROCm System Management Interface ======================= + 9: ================================= Concise Info ================================= + 9: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 9: 0 38.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 2 38.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 4 41.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 6 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: ================================================================================ + 9: ============================= End of ROCm SMI Log ============================== + 5: + 5: + 5: ======================= ROCm System Management Interface ======================= + 5: ================================= Concise Info ================================= + 5: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 5: 0 45.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 2 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 4 41.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 5 38.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 6 39.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: ================================================================================ + 5: ============================= End of ROCm SMI Log ============================== +28: +28: +28: ======================= ROCm System Management Interface ======================= +28: ================================= Concise Info ================================= +28: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +28: 0 48.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 4 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 6 43.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: ================================================================================ +28: ============================= End of ROCm SMI Log ============================== +15: +15: +15: ======================= ROCm System Management Interface ======================= +15: ================================= Concise Info ================================= +15: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +15: 0 44.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 2 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 4 47.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 5 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 6 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: ================================================================================ +15: ============================= End of ROCm SMI Log ============================== +11: +11: +11: ======================= ROCm System Management Interface ======================= +11: ================================= Concise Info ================================= +11: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +11: 0 47.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 2 39.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 4 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 6 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: ================================================================================ +11: ============================= End of ROCm SMI Log ============================== + 7: + 7: + 7: ======================= ROCm System Management Interface ======================= + 7: ================================= Concise Info ================================= + 7: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 7: 0 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 2 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 4 48.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 6 36.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: ================================================================================ + 7: ============================= End of ROCm SMI Log ============================== +12: +12: +12: ======================= ROCm System Management Interface ======================= +12: ================================= Concise Info ================================= +12: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +12: 0 44.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 4 45.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 6 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 7 38.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: ================================================================================ +12: ============================= End of ROCm SMI Log ============================== + 1: + 1: + 1: ======================= ROCm System Management Interface ======================= + 1: ================================= Concise Info ================================= + 1: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 1: 0 47.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 2 39.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 4 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 6 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: ================================================================================ + 1: ============================= End of ROCm SMI Log ============================== +29: +29: +29: ======================= ROCm System Management Interface ======================= +29: ================================= Concise Info ================================= +29: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +29: 0 47.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 2 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 4 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 6 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: ================================================================================ +29: ============================= End of ROCm SMI Log ============================== + 4: Launching on nid005421 (4/32), master nid005155 port 9999, GPUs 8, CUDA: True +30: Launching on nid007235 (30/32), master nid005155 port 9999, GPUs 8, CUDA: True + 8: Launching on nid005425 (8/32), master nid005155 port 9999, GPUs 8, CUDA: True +13: Launching on nid005430 (13/32), master nid005155 port 9999, GPUs 8, CUDA: True +24: Launching on nid005905 (24/32), master nid005155 port 9999, GPUs 8, CUDA: True + 5: Launching on nid005422 (5/32), master nid005155 port 9999, GPUs 8, CUDA: True +26: Launching on nid006867 (26/32), master nid005155 port 9999, GPUs 8, CUDA: True +31: Launching on nid007236 (31/32), master nid005155 port 9999, GPUs 8, CUDA: True + 2: Launching on nid005166 (2/32), master nid005155 port 9999, GPUs 8, CUDA: True +21: Launching on nid005902 (21/32), master nid005155 port 9999, GPUs 8, CUDA: True +27: Launching on nid006868 (27/32), master nid005155 port 9999, GPUs 8, CUDA: True +25: Launching on nid005906 (25/32), master nid005155 port 9999, GPUs 8, CUDA: True + 9: Launching on nid005426 (9/32), master nid005155 port 9999, GPUs 8, CUDA: True +16: Launching on nid005434 (16/32), master nid005155 port 9999, GPUs 8, CUDA: True + 3: Launching on nid005266 (3/32), master nid005155 port 9999, GPUs 8, CUDA: True +10: Launching on nid005427 (10/32), master nid005155 port 9999, GPUs 8, CUDA: True + 0: Launching on nid005155 (0/32), master nid005155 port 9999, GPUs 8, CUDA: True + 6: Launching on nid005423 (6/32), master nid005155 port 9999, GPUs 8, CUDA: True +22: Launching on nid005903 (22/32), master nid005155 port 9999, GPUs 8, CUDA: True +20: Launching on nid005568 (20/32), master nid005155 port 9999, GPUs 8, CUDA: True +17: Launching on nid005435 (17/32), master nid005155 port 9999, GPUs 8, CUDA: True +19: Launching on nid005567 (19/32), master nid005155 port 9999, GPUs 8, CUDA: True +18: Launching on nid005456 (18/32), master nid005155 port 9999, GPUs 8, CUDA: True +23: Launching on nid005904 (23/32), master nid005155 port 9999, GPUs 8, CUDA: True + 7: Launching on nid005424 (7/32), master nid005155 port 9999, GPUs 8, CUDA: True +14: Launching on nid005431 (14/32), master nid005155 port 9999, GPUs 8, CUDA: True +11: Launching on nid005428 (11/32), master nid005155 port 9999, GPUs 8, CUDA: True +12: Launching on nid005429 (12/32), master nid005155 port 9999, GPUs 8, CUDA: True +15: Launching on nid005432 (15/32), master nid005155 port 9999, GPUs 8, CUDA: True +28: Launching on nid007232 (28/32), master nid005155 port 9999, GPUs 8, CUDA: True + 1: Launching on nid005165 (1/32), master nid005155 port 9999, GPUs 8, CUDA: True +29: Launching on nid007233 (29/32), master nid005155 port 9999, GPUs 8, CUDA: True + 0: using world size: 256, data-parallel-size: 256, tensor-model-parallel size: 1, pipeline-model-parallel size: 1 + 0: accumulate and all-reduce gradients in fp32 for bfloat16 data type. + 0: using torch.bfloat16 for parameters ... + 0: ------------------------ arguments ------------------------ + 0: abort_on_unmet_fused_kernel_constraints ......... False + 0: accumulate_allreduce_grads_in_fp32 .............. True + 0: adam_beta1 ...................................... 0.9 + 0: adam_beta2 ...................................... 0.999 + 0: adam_eps ........................................ 1e-08 + 0: adlr_autoresume ................................. False + 0: adlr_autoresume_interval ........................ 1000 + 0: apply_query_key_layer_scaling ................... True + 0: apply_residual_connection_post_layernorm ........ False + 0: attention_dropout ............................... 0.1 + 0: attention_softmax_in_fp32 ....................... False + 0: bert_binary_head ................................ True + 0: bert_load ....................................... None + 0: bf16 ............................................ True + 0: bias_dropout_fusion ............................. True + 0: bias_gelu_fusion ................................ True + 0: biencoder_projection_dim ........................ 0 + 0: biencoder_shared_query_context_model ............ False + 0: block_data_path ................................. None + 0: checkpoint_activations .......................... False + 0: checkpoint_in_cpu ............................... False + 0: checkpoint_num_layers ........................... 1 + 0: clip_grad ....................................... 1.0 + 0: codecarbon_dir .................................. None + 0: consumed_train_samples .......................... 0 + 0: consumed_train_tokens ........................... 0 + 0: consumed_valid_samples .......................... 0 + 0: contigious_checkpointing ........................ False + 0: cpu_optimizer ................................... False + 0: cpu_torch_adam .................................. False + 0: curriculum_learning ............................. False + 0: data_impl ....................................... mmap + 0: data_parallel_size .............................. 256 + 0: data_path ....................................... None + 0: dataloader_type ................................. single + 0: DDP_impl ........................................ local + 0: decoder_seq_length .............................. None + 0: deepscale ....................................... False + 0: deepscale_config ................................ None + 0: deepspeed ....................................... True + 0: deepspeed_activation_checkpointing .............. False + 0: deepspeed_config ................................ ds_configs/3510097.json + 0: deepspeed_mpi ................................... False + 0: distribute_checkpointed_activations ............. False + 0: distributed_backend ............................. nccl + 0: embed_layernorm ................................. False + 0: embedding_path .................................. None + 0: encoder_seq_length .............................. 2048 + 0: eod_mask_loss ................................... False + 0: eval_interval ................................... 1 + 0: eval_iters ...................................... 100 + 0: eval_only ....................................... True + 0: evidence_data_path .............................. None + 0: exit_duration_in_mins ........................... None + 0: exit_interval ................................... None + 0: ffn_hidden_size ................................. 10240 + 0: finetune ........................................ False + 0: fp16 ............................................ False + 0: fp16_lm_cross_entropy ........................... False + 0: fp32_residual_connection ........................ False + 0: gigaflos_no_embeds .............................. 0 + 0: global_batch_size ............................... 512 + 0: glu_activation .................................. None + 0: hidden_dropout .................................. 0.1 + 0: hidden_size ..................................... 2560 + 0: hysteresis ...................................... 2 + 0: ict_head_size ................................... None + 0: ict_load ........................................ None + 0: img_dim ......................................... 224 + 0: indexer_batch_size .............................. 128 + 0: indexer_log_interval ............................ 1000 + 0: inference ....................................... False + 0: init_method_std ................................. 0.02 + 0: init_method_xavier_uniform ...................... False + 0: initial_loss_scale .............................. 4294967296 + 0: kill_switch_path ................................ kill-switch-2b855b55bc4perplexity25val + 0: kv_channels ..................................... 128 + 0: layer_norm_fusion ............................... True + 0: layernorm_epsilon ............................... 1e-05 + 0: lazy_mpu_init ................................... None + 0: load ............................................ lm1-2b8-55b-c4-repetitions/perplexity25 + 0: local_rank ...................................... None + 0: log_batch_size_to_tensorboard ................... True + 0: log_interval .................................... 10 + 0: log_learning_rate_to_tensorboard ................ True + 0: log_level ....................................... None + 0: log_level_replica ............................... None + 0: log_loss_scale_to_tensorboard ................... True + 0: log_num_zeros_in_grad ........................... False + 0: log_params_norm ................................. False + 0: log_path ........................................ None + 0: log_timers_to_tensorboard ....................... True + 0: log_validation_ppl_to_tensorboard ............... True + 0: loss_on_targets_only ............................ False + 0: loss_scale ...................................... None + 0: loss_scale_window ............................... 1000 + 0: lr .............................................. 0.0002 + 0: lr_decay_iters .................................. None + 0: lr_decay_samples ................................ 1 + 0: lr_decay_style .................................. cosine + 0: lr_decay_tokens ................................. None + 0: lr_warmup_fraction .............................. None + 0: lr_warmup_iters ................................. 0 + 0: lr_warmup_samples ............................... 0 + 0: make_vocab_size_divisible_by .................... 128 + 0: mask_prob ....................................... 0.15 + 0: masked_softmax_fusion ........................... True + 0: max_position_embeddings ......................... 2048 + 0: mean_noise_span_length .......................... None + 0: memory_centric_tiled_linear ..................... False + 0: merge_file ...................................... gpt2/merges.txt + 0: micro_batch_size ................................ 2 + 0: min_loss_scale .................................. 1.0 + 0: min_lr .......................................... 2e-05 + 0: mmap_warmup ..................................... False + 0: no_load_optim ................................... True + 0: no_load_rng ..................................... None + 0: no_save_optim ................................... None + 0: no_save_rng ..................................... None + 0: noise_density ................................... None + 0: num_attention_heads ............................. 20 + 0: num_channels .................................... 3 + 0: num_classes ..................................... 1000 + 0: num_layers ...................................... 34 + 0: num_layers_per_virtual_pipeline_stage ........... None + 0: num_workers ..................................... 2 + 0: onnx_safe ....................................... None + 0: openai_gelu ..................................... False + 0: optimizer ....................................... adam + 0: optimizer_fusion ................................ True + 0: override_lr_scheduler ........................... True + 0: pad_vocab_size_to ............................... None + 0: params_dtype .................................... torch.bfloat16 + 0: partition_activations ........................... False + 0: patch_dim ....................................... 16 + 0: pipeline_model_parallel_size .................... 1 + 0: position_embedding_type ......................... PositionEmbeddingType.absolute + 0: pp_partition_method ............................. None + 0: profile_backward ................................ False + 0: query_in_block_prob ............................. 0.1 + 0: rampup_batch_size ............................... None + 0: rank ............................................ 0 + 0: remote_device ................................... none + 0: reset_attention_mask ............................ False + 0: reset_position_ids .............................. False + 0: reset_progress .................................. True + 0: retriever_report_topk_accuracies ................ [] + 0: retriever_score_scaling ......................... False + 0: retriever_seq_length ............................ 256 + 0: reweight_loss_based_on_position_frequency ....... False + 0: sample_rate ..................................... 1.0 + 0: save ............................................ lm1-2b8-55b-c4-repetitions/perplexity25 + 0: save_interval ................................... 1000 + 0: scatter_gather_tensors_in_pipeline .............. True + 0: scattered_embeddings ............................ False + 0: seed ............................................ 1234 + 0: seq_length ...................................... 2048 + 0: sgd_momentum .................................... 0.9 + 0: short_seq_prob .................................. 0.1 + 0: skip_train_iteration_range ...................... None + 0: split ........................................... None + 0: split_transformers .............................. False + 0: sync_tp_duplicated_parameters ................... False + 0: synchronize_each_layer .......................... False + 0: tensor_model_parallel_size ...................... 1 + 0: tensorboard_dir ................................. tensorboard_2b855b55bc4perplexity25val + 0: tensorboard_log_interval ........................ 1 + 0: tensorboard_queue_size .......................... 5 + 0: test_weighted_split_paths ....................... None + 0: test_weighted_split_paths_path .................. None + 0: tile_factor ..................................... 1 + 0: titles_data_path ................................ None + 0: tokenizer_name_or_path .......................... None + 0: tokenizer_type .................................. GPT2BPETokenizer + 0: train_iters ..................................... None + 0: train_samples ................................... 1 + 0: train_tokens .................................... None + 0: train_weighted_split_names ...................... ['train'] + 0: train_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document']] + 0: train_weighted_split_paths_path ................. None + 0: train_weighted_split_splits ..................... [['0:1']] + 0: train_weighted_split_weights .................... [['1.0']] + 0: universal_checkpoint ............................ False + 0: use_bnb_optimizer ............................... False + 0: use_checkpoint_lr_scheduler ..................... False + 0: use_contiguous_buffers_in_ddp ................... True + 0: use_cpu_initialization .......................... None + 0: use_one_sent_docs ............................... False + 0: use_pin_memory .................................. False + 0: valid_num_workers ............................... 2 + 0: valid_weighted_split_names ...................... ['validation'] + 0: valid_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document']] + 0: valid_weighted_split_paths_path ................. None + 0: valid_weighted_split_splits ..................... [['0:1']] + 0: valid_weighted_split_weights .................... [['1.0']] + 0: virtual_pipeline_model_parallel_size ............ None + 0: vocab_extra_ids ................................. 0 + 0: vocab_file ...................................... gpt2/vocab.json + 0: weight_decay .................................... 0.1 + 0: world_size ...................................... 256 + 0: zero_allgather_bucket_size ...................... 0.0 + 0: zero_contigious_gradients ....................... False + 0: zero_reduce_bucket_size ......................... 0.0 + 0: zero_reduce_scatter ............................. False + 0: zero_stage ...................................... 0 + 0: -------------------- end of arguments --------------------- + 0: setting number of micro-batches to constant 1 + 0: > building GPT2BPETokenizer tokenizer ... + 0: > padded vocab (size: 50257) with 47 dummy tokens (new size: 50304) + 0: DeepSpeed general environment info: + 0: torch install path ............... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch'] + 0: torch version .................... 1.13.0+rocm5.2 + 0: torch cuda version ............... None + 0: torch hip version ................ 5.2.21151-afdc89f8 + 0: nvcc version ..................... None + 0: deepspeed install path ........... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/deepspeed'] + 0: deepspeed info ................... 0.7.5, unknown, unknown + 0: deepspeed wheel compiled w. ...... torch 1.13, hip 5.1 + 0: **** Git info for Megatron: git_hash=unknown git_branch=unknown **** + 0: > initializing torch distributed ... + 0: [2023-05-13 03:26:53,751] [INFO] [comm.py:633:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl +31: > setting tensorboard ... + 0: > initializing tensor model parallel with size 1 + 0: > initializing pipeline model parallel with size 1 + 0: > setting random seeds to 1234 ... + 0: > initializing model parallel cuda seeds on global rank 0, model parallel rank 0, and data parallel rank 0 with model parallel seed: 3952 and data parallel seed: 1234 + 0: > compiling dataset index builder ... + 0: make: Entering directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: make: Nothing to be done for 'default'. + 0: make: Leaving directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: >>> done with dataset index builder. Compilation time: 0.097 seconds + 0: > compiling and loading fused kernels ... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 87 + 0: [1/1] c++ scaled_upper_triang_masked_softmax_hip.cuda.o scaled_upper_triang_masked_softmax_hip.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o scaled_upper_triang_masked_softmax_cuda.so + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 63 + 0: ninja: no work to do. + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda_kernel.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_hip_kernel.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 67 + 0: ninja: no work to do. + 0: >>> done with compiling and loading fused kernels. Compilation time: 39.425 seconds + 0: time to initialize megatron (seconds): 0.539 + 0: [after megatron is initialized] datetime: 2023-05-13 03:27:44 + 0: building GPT model ... + 0: [2023-05-13 03:27:44,692] [INFO] [utils.py:827:see_memory_usage] Before Building Model + 0: [2023-05-13 03:27:44,693] [INFO] [utils.py:828:see_memory_usage] MA 0.0 GB Max_MA 0.0 GB CA 0.0 GB Max_CA 0 GB + 0: [2023-05-13 03:27:44,693] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.59 GB, percent = 8.1% + 0: SEED_LAYERS=False BASE_SEED=1234 SEED_FN=None + 0: Using topology: {ProcessCoord(pipe=0, data=0, model=0): 0, ProcessCoord(pipe=0, data=1, model=0): 1, ProcessCoord(pipe=0, data=2, model=0): 2, ProcessCoord(pipe=0, data=3, model=0): 3, ProcessCoord(pipe=0, data=4, model=0): 4, ProcessCoord(pipe=0, data=5, model=0): 5, ProcessCoord(pipe=0, data=6, model=0): 6, ProcessCoord(pipe=0, data=7, model=0): 7, ProcessCoord(pipe=0, data=8, model=0): 8, ProcessCoord(pipe=0, data=9, model=0): 9, ProcessCoord(pipe=0, data=10, model=0): 10, ProcessCoord(pipe=0, data=11, model=0): 11, ProcessCoord(pipe=0, data=12, model=0): 12, ProcessCoord(pipe=0, data=13, model=0): 13, ProcessCoord(pipe=0, data=14, model=0): 14, ProcessCoord(pipe=0, data=15, model=0): 15, ProcessCoord(pipe=0, data=16, model=0): 16, ProcessCoord(pipe=0, data=17, model=0): 17, ProcessCoord(pipe=0, data=18, model=0): 18, ProcessCoord(pipe=0, data=19, model=0): 19, ProcessCoord(pipe=0, data=20, model=0): 20, ProcessCoord(pipe=0, data=21, model=0): 21, ProcessCoord(pipe=0, data=22, model=0): 22, ProcessCoord(pi + 0: pe=0, data=23, model=0): 23, ProcessCoord(pipe=0, data=24, model=0): 24, ProcessCoord(pipe=0, data=25, model=0): 25, ProcessCoord(pipe=0, data=26, model=0): 26, ProcessCoord(pipe=0, data=27, model=0): 27, ProcessCoord(pipe=0, data=28, model=0): 28, ProcessCoord(pipe=0, data=29, model=0): 29, ProcessCoord(pipe=0, data=30, model=0): 30, ProcessCoord(pipe=0, data=31, model=0): 31, ProcessCoord(pipe=0, data=32, model=0): 32, ProcessCoord(pipe=0, data=33, model=0): 33, ProcessCoord(pipe=0, data=34, model=0): 34, ProcessCoord(pipe=0, data=35, model=0): 35, ProcessCoord(pipe=0, data=36, model=0): 36, ProcessCoord(pipe=0, data=37, model=0): 37, ProcessCoord(pipe=0, data=38, model=0): 38, ProcessCoord(pipe=0, data=39, model=0): 39, ProcessCoord(pipe=0, data=40, model=0): 40, ProcessCoord(pipe=0, data=41, model=0): 41, ProcessCoord(pipe=0, data=42, model=0): 42, ProcessCoord(pipe=0, data=43, model=0): 43, ProcessCoord(pipe=0, data=44, model=0): 44, ProcessCoord(pipe=0, data=45, model=0): 45, ProcessCoord(pipe=0, data=4 + 0: 6, model=0): 46, ProcessCoord(pipe=0, data=47, model=0): 47, ProcessCoord(pipe=0, data=48, model=0): 48, ProcessCoord(pipe=0, data=49, model=0): 49, ProcessCoord(pipe=0, data=50, model=0): 50, ProcessCoord(pipe=0, data=51, model=0): 51, ProcessCoord(pipe=0, data=52, model=0): 52, ProcessCoord(pipe=0, data=53, model=0): 53, ProcessCoord(pipe=0, data=54, model=0): 54, ProcessCoord(pipe=0, data=55, model=0): 55, ProcessCoord(pipe=0, data=56, model=0): 56, ProcessCoord(pipe=0, data=57, model=0): 57, ProcessCoord(pipe=0, data=58, model=0): 58, ProcessCoord(pipe=0, data=59, model=0): 59, ProcessCoord(pipe=0, data=60, model=0): 60, ProcessCoord(pipe=0, data=61, model=0): 61, ProcessCoord(pipe=0, data=62, model=0): 62, ProcessCoord(pipe=0, data=63, model=0): 63, ProcessCoord(pipe=0, data=64, model=0): 64, ProcessCoord(pipe=0, data=65, model=0): 65, ProcessCoord(pipe=0, data=66, model=0): 66, ProcessCoord(pipe=0, data=67, model=0): 67, ProcessCoord(pipe=0, data=68, model=0): 68, ProcessCoord(pipe=0, data=69, model=0): + 0: 69, ProcessCoord(pipe=0, data=70, model=0): 70, ProcessCoord(pipe=0, data=71, model=0): 71, ProcessCoord(pipe=0, data=72, model=0): 72, ProcessCoord(pipe=0, data=73, model=0): 73, ProcessCoord(pipe=0, data=74, model=0): 74, ProcessCoord(pipe=0, data=75, model=0): 75, ProcessCoord(pipe=0, data=76, model=0): 76, ProcessCoord(pipe=0, data=77, model=0): 77, ProcessCoord(pipe=0, data=78, model=0): 78, ProcessCoord(pipe=0, data=79, model=0): 79, ProcessCoord(pipe=0, data=80, model=0): 80, ProcessCoord(pipe=0, data=81, model=0): 81, ProcessCoord(pipe=0, data=82, model=0): 82, ProcessCoord(pipe=0, data=83, model=0): 83, ProcessCoord(pipe=0, data=84, model=0): 84, ProcessCoord(pipe=0, data=85, model=0): 85, ProcessCoord(pipe=0, data=86, model=0): 86, ProcessCoord(pipe=0, data=87, model=0): 87, ProcessCoord(pipe=0, data=88, model=0): 88, ProcessCoord(pipe=0, data=89, model=0): 89, ProcessCoord(pipe=0, data=90, model=0): 90, ProcessCoord(pipe=0, data=91, model=0): 91, ProcessCoord(pipe=0, data=92, model=0): 92, Process + 0: Coord(pipe=0, data=93, model=0): 93, ProcessCoord(pipe=0, data=94, model=0): 94, ProcessCoord(pipe=0, data=95, model=0): 95, ProcessCoord(pipe=0, data=96, model=0): 96, ProcessCoord(pipe=0, data=97, model=0): 97, ProcessCoord(pipe=0, data=98, model=0): 98, ProcessCoord(pipe=0, data=99, model=0): 99, ProcessCoord(pipe=0, data=100, model=0): 100, ProcessCoord(pipe=0, data=101, model=0): 101, ProcessCoord(pipe=0, data=102, model=0): 102, ProcessCoord(pipe=0, data=103, model=0): 103, ProcessCoord(pipe=0, data=104, model=0): 104, ProcessCoord(pipe=0, data=105, model=0): 105, ProcessCoord(pipe=0, data=106, model=0): 106, ProcessCoord(pipe=0, data=107, model=0): 107, ProcessCoord(pipe=0, data=108, model=0): 108, ProcessCoord(pipe=0, data=109, model=0): 109, ProcessCoord(pipe=0, data=110, model=0): 110, ProcessCoord(pipe=0, data=111, model=0): 111, ProcessCoord(pipe=0, data=112, model=0): 112, ProcessCoord(pipe=0, data=113, model=0): 113, ProcessCoord(pipe=0, data=114, model=0): 114, ProcessCoord(pipe=0, data=115, mo + 0: del=0): 115, ProcessCoord(pipe=0, data=116, model=0): 116, ProcessCoord(pipe=0, data=117, model=0): 117, ProcessCoord(pipe=0, data=118, model=0): 118, ProcessCoord(pipe=0, data=119, model=0): 119, ProcessCoord(pipe=0, data=120, model=0): 120, ProcessCoord(pipe=0, data=121, model=0): 121, ProcessCoord(pipe=0, data=122, model=0): 122, ProcessCoord(pipe=0, data=123, model=0): 123, ProcessCoord(pipe=0, data=124, model=0): 124, ProcessCoord(pipe=0, data=125, model=0): 125, ProcessCoord(pipe=0, data=126, model=0): 126, ProcessCoord(pipe=0, data=127, model=0): 127, ProcessCoord(pipe=0, data=128, model=0): 128, ProcessCoord(pipe=0, data=129, model=0): 129, ProcessCoord(pipe=0, data=130, model=0): 130, ProcessCoord(pipe=0, data=131, model=0): 131, ProcessCoord(pipe=0, data=132, model=0): 132, ProcessCoord(pipe=0, data=133, model=0): 133, ProcessCoord(pipe=0, data=134, model=0): 134, ProcessCoord(pipe=0, data=135, model=0): 135, ProcessCoord(pipe=0, data=136, model=0): 136, ProcessCoord(pipe=0, data=137, model=0): 137, + 0: ProcessCoord(pipe=0, data=138, model=0): 138, ProcessCoord(pipe=0, data=139, model=0): 139, ProcessCoord(pipe=0, data=140, model=0): 140, ProcessCoord(pipe=0, data=141, model=0): 141, ProcessCoord(pipe=0, data=142, model=0): 142, ProcessCoord(pipe=0, data=143, model=0): 143, ProcessCoord(pipe=0, data=144, model=0): 144, ProcessCoord(pipe=0, data=145, model=0): 145, ProcessCoord(pipe=0, data=146, model=0): 146, ProcessCoord(pipe=0, data=147, model=0): 147, ProcessCoord(pipe=0, data=148, model=0): 148, ProcessCoord(pipe=0, data=149, model=0): 149, ProcessCoord(pipe=0, data=150, model=0): 150, ProcessCoord(pipe=0, data=151, model=0): 151, ProcessCoord(pipe=0, data=152, model=0): 152, ProcessCoord(pipe=0, data=153, model=0): 153, ProcessCoord(pipe=0, data=154, model=0): 154, ProcessCoord(pipe=0, data=155, model=0): 155, ProcessCoord(pipe=0, data=156, model=0): 156, ProcessCoord(pipe=0, data=157, model=0): 157, ProcessCoord(pipe=0, data=158, model=0): 158, ProcessCoord(pipe=0, data=159, model=0): 159, ProcessCoor + 0: d(pipe=0, data=160, model=0): 160, ProcessCoord(pipe=0, data=161, model=0): 161, ProcessCoord(pipe=0, data=162, model=0): 162, ProcessCoord(pipe=0, data=163, model=0): 163, ProcessCoord(pipe=0, data=164, model=0): 164, ProcessCoord(pipe=0, data=165, model=0): 165, ProcessCoord(pipe=0, data=166, model=0): 166, ProcessCoord(pipe=0, data=167, model=0): 167, ProcessCoord(pipe=0, data=168, model=0): 168, ProcessCoord(pipe=0, data=169, model=0): 169, ProcessCoord(pipe=0, data=170, model=0): 170, ProcessCoord(pipe=0, data=171, model=0): 171, ProcessCoord(pipe=0, data=172, model=0): 172, ProcessCoord(pipe=0, data=173, model=0): 173, ProcessCoord(pipe=0, data=174, model=0): 174, ProcessCoord(pipe=0, data=175, model=0): 175, ProcessCoord(pipe=0, data=176, model=0): 176, ProcessCoord(pipe=0, data=177, model=0): 177, ProcessCoord(pipe=0, data=178, model=0): 178, ProcessCoord(pipe=0, data=179, model=0): 179, ProcessCoord(pipe=0, data=180, model=0): 180, ProcessCoord(pipe=0, data=181, model=0): 181, ProcessCoord(pipe=0, da + 0: ta=182, model=0): 182, ProcessCoord(pipe=0, data=183, model=0): 183, ProcessCoord(pipe=0, data=184, model=0): 184, ProcessCoord(pipe=0, data=185, model=0): 185, ProcessCoord(pipe=0, data=186, model=0): 186, ProcessCoord(pipe=0, data=187, model=0): 187, ProcessCoord(pipe=0, data=188, model=0): 188, ProcessCoord(pipe=0, data=189, model=0): 189, ProcessCoord(pipe=0, data=190, model=0): 190, ProcessCoord(pipe=0, data=191, model=0): 191, ProcessCoord(pipe=0, data=192, model=0): 192, ProcessCoord(pipe=0, data=193, model=0): 193, ProcessCoord(pipe=0, data=194, model=0): 194, ProcessCoord(pipe=0, data=195, model=0): 195, ProcessCoord(pipe=0, data=196, model=0): 196, ProcessCoord(pipe=0, data=197, model=0): 197, ProcessCoord(pipe=0, data=198, model=0): 198, ProcessCoord(pipe=0, data=199, model=0): 199, ProcessCoord(pipe=0, data=200, model=0): 200, ProcessCoord(pipe=0, data=201, model=0): 201, ProcessCoord(pipe=0, data=202, model=0): 202, ProcessCoord(pipe=0, data=203, model=0): 203, ProcessCoord(pipe=0, data=204, mode + 0: l=0): 204, ProcessCoord(pipe=0, data=205, model=0): 205, ProcessCoord(pipe=0, data=206, model=0): 206, ProcessCoord(pipe=0, data=207, model=0): 207, ProcessCoord(pipe=0, data=208, model=0): 208, ProcessCoord(pipe=0, data=209, model=0): 209, ProcessCoord(pipe=0, data=210, model=0): 210, ProcessCoord(pipe=0, data=211, model=0): 211, ProcessCoord(pipe=0, data=212, model=0): 212, ProcessCoord(pipe=0, data=213, model=0): 213, ProcessCoord(pipe=0, data=214, model=0): 214, ProcessCoord(pipe=0, data=215, model=0): 215, ProcessCoord(pipe=0, data=216, model=0): 216, ProcessCoord(pipe=0, data=217, model=0): 217, ProcessCoord(pipe=0, data=218, model=0): 218, ProcessCoord(pipe=0, data=219, model=0): 219, ProcessCoord(pipe=0, data=220, model=0): 220, ProcessCoord(pipe=0, data=221, model=0): 221, ProcessCoord(pipe=0, data=222, model=0): 222, ProcessCoord(pipe=0, data=223, model=0): 223, ProcessCoord(pipe=0, data=224, model=0): 224, ProcessCoord(pipe=0, data=225, model=0): 225, ProcessCoord(pipe=0, data=226, model=0): 226, P + 0: rocessCoord(pipe=0, data=227, model=0): 227, ProcessCoord(pipe=0, data=228, model=0): 228, ProcessCoord(pipe=0, data=229, model=0): 229, ProcessCoord(pipe=0, data=230, model=0): 230, ProcessCoord(pipe=0, data=231, model=0): 231, ProcessCoord(pipe=0, data=232, model=0): 232, ProcessCoord(pipe=0, data=233, model=0): 233, ProcessCoord(pipe=0, data=234, model=0): 234, ProcessCoord(pipe=0, data=235, model=0): 235, ProcessCoord(pipe=0, data=236, model=0): 236, ProcessCoord(pipe=0, data=237, model=0): 237, ProcessCoord(pipe=0, data=238, model=0): 238, ProcessCoord(pipe=0, data=239, model=0): 239, ProcessCoord(pipe=0, data=240, model=0): 240, ProcessCoord(pipe=0, data=241, model=0): 241, ProcessCoord(pipe=0, data=242, model=0): 242, ProcessCoord(pipe=0, data=243, model=0): 243, ProcessCoord(pipe=0, data=244, model=0): 244, ProcessCoord(pipe=0, data=245, model=0): 245, ProcessCoord(pipe=0, data=246, model=0): 246, ProcessCoord(pipe=0, data=247, model=0): 247, ProcessCoord(pipe=0, data=248, model=0): 248, ProcessCoord( + 0: pipe=0, data=249, model=0): 249, ProcessCoord(pipe=0, data=250, model=0): 250, ProcessCoord(pipe=0, data=251, model=0): 251, ProcessCoord(pipe=0, data=252, model=0): 252, ProcessCoord(pipe=0, data=253, model=0): 253, ProcessCoord(pipe=0, data=254, model=0): 254, ProcessCoord(pipe=0, data=255, model=0): 255} + 0: [2023-05-13 03:27:52,909] [INFO] [module.py:366:_partition_layers] Partitioning pipeline stages with method type:transformer + 0: stage=0 layers=41 + 0: 0: _to_float16 + 0: 1: EmbeddingPipe + 0: 2: + 0: 3: ParallelTransformerLayerPipe + 0: 4: ParallelTransformerLayerPipe + 0: 5: ParallelTransformerLayerPipe + 0: 6: ParallelTransformerLayerPipe + 0: 7: ParallelTransformerLayerPipe + 0: 8: ParallelTransformerLayerPipe + 0: 9: ParallelTransformerLayerPipe + 0: 10: ParallelTransformerLayerPipe + 0: 11: ParallelTransformerLayerPipe + 0: 12: ParallelTransformerLayerPipe + 0: 13: ParallelTransformerLayerPipe + 0: 14: ParallelTransformerLayerPipe + 0: 15: ParallelTransformerLayerPipe + 0: 16: ParallelTransformerLayerPipe + 0: 17: ParallelTransformerLayerPipe + 0: 18: ParallelTransformerLayerPipe + 0: 19: ParallelTransformerLayerPipe + 0: 20: ParallelTransformerLayerPipe + 0: 21: ParallelTransformerLayerPipe + 0: 22: ParallelTransformerLayerPipe + 0: 23: ParallelTransformerLayerPipe + 0: 24: ParallelTransformerLayerPipe + 0: 25: ParallelTransformerLayerPipe + 0: 26: ParallelTransformerLayerPipe + 0: 27: ParallelTransformerLayerPipe + 0: 28: ParallelTransformerLayerPipe + 0: 29: ParallelTransformerLayerPipe + 0: 30: ParallelTransformerLayerPipe + 0: 31: ParallelTransformerLayerPipe + 0: 32: ParallelTransformerLayerPipe + 0: 33: ParallelTransformerLayerPipe + 0: 34: ParallelTransformerLayerPipe + 0: 35: ParallelTransformerLayerPipe + 0: 36: ParallelTransformerLayerPipe + 0: 37: undo + 0: 38: MixedFusedLayerNorm + 0: 39: EmbeddingPipe + 0: 40: float16_to_fp32 + 0: loss: CrossEntropy + 0: [2023-05-13 03:27:53,518] [INFO] [utils.py:827:see_memory_usage] After Building Model + 0: [2023-05-13 03:27:53,519] [INFO] [utils.py:828:see_memory_usage] MA 5.26 GB Max_MA 5.26 GB CA 5.31 GB Max_CA 5 GB + 0: [2023-05-13 03:27:53,519] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.76 GB, percent = 8.1% + 0: setting training iterations to 0 + 0: > learning rate decay style: cosine + 0: DeepSpeed is enabled. + 0: [2023-05-13 03:27:53,521] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed info: version=0.7.5, git-hash=unknown, git-branch=unknown + 0: [2023-05-13 03:28:17,659] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Flops Profiler Enabled: False + 0: [2023-05-13 03:28:17,659] [INFO] [logging.py:68:log_dist] [Rank 0] Removing param_group that has no 'params' in the client Optimizer + 0: [2023-05-13 03:28:17,660] [INFO] [logging.py:68:log_dist] [Rank 0] Using client Optimizer as basic optimizer + 0: [2023-05-13 03:28:17,679] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Basic Optimizer = FusedAdam + 0: [2023-05-13 03:28:17,679] [INFO] [logging.py:68:log_dist] [Rank 0] Creating BF16 optimizer + 0: [2023-05-13 03:28:17,805] [INFO] [utils.py:827:see_memory_usage] begin bf16_optimizer + 0: [2023-05-13 03:28:17,805] [INFO] [utils.py:828:see_memory_usage] MA 5.25 GB Max_MA 5.27 GB CA 5.32 GB Max_CA 5 GB + 0: [2023-05-13 03:28:17,805] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.48 GB, percent = 8.2% + 0: ninja: no work to do. + 2: Time to load utils op: 0.5143978595733643 seconds + 2: Time to load utils op: 0.5141267776489258 seconds + 2: Time to load utils op: 0.5147995948791504 secondsTime to load utils op: 0.5109837055206299 seconds + 2: + 2: Time to load utils op: 0.5142049789428711 seconds + 2: Time to load utils op: 0.5134398937225342 seconds + 2: Time to load utils op: 0.513641357421875 seconds + 2: Time to load utils op: 0.5140392780303955 seconds +30: Time to load utils op: 0.4775400161743164 secondsTime to load utils op: 0.47826576232910156 seconds +30: +30: Time to load utils op: 0.47828149795532227 seconds +30: Time to load utils op: 0.47878050804138184 seconds +30: Time to load utils op: 0.4791121482849121 seconds +30: Time to load utils op: 0.4781055450439453 seconds +30: Time to load utils op: 0.47879672050476074 seconds +30: Time to load utils op: 0.47881412506103516 seconds +12: Time to load utils op: 0.47573208808898926 seconds +12: Time to load utils op: 0.4757540225982666 seconds +12: Time to load utils op: 0.4757516384124756 seconds + 6: Time to load utils op: 0.5116944313049316 secondsTime to load utils op: 0.5115396976470947 seconds + 6: + 7: Time to load utils op: 0.5095956325531006 seconds + 7: Time to load utils op: 0.5096330642700195 secondsTime to load utils op: 0.5095264911651611 seconds + 7: + 6: Time to load utils op: 0.5119781494140625 seconds +12: Time to load utils op: 0.4758141040802002 seconds +12: Time to load utils op: 0.4758107662200928 seconds + 6: Time to load utils op: 0.5112607479095459 seconds + 6: Time to load utils op: 0.5109653472900391 seconds + 6: Time to load utils op: 0.511533260345459 secondsTime to load utils op: 0.5118067264556885 seconds +12: Time to load utils op: 0.4758303165435791 seconds + 6: Time to load utils op: 0.5112936496734619 seconds + 6: + 7: Time to load utils op: 0.5096590518951416 secondsTime to load utils op: 0.5094242095947266 seconds + 7: + 7: Time to load utils op: 0.5095326900482178 seconds +12: Time to load utils op: 0.4757869243621826 seconds + 7: Time to load utils op: 0.509650468826294 seconds + 7: Time to load utils op: 0.5096375942230225 seconds +12: Time to load utils op: 0.47576189041137695 seconds +29: Time to load utils op: 0.47697019577026367 secondsTime to load utils op: 0.47697997093200684 seconds +29: +29: Time to load utils op: 0.47704601287841797 seconds +29: Time to load utils op: 0.47705745697021484 seconds +29: Time to load utils op: 0.4770627021789551 seconds +29: Time to load utils op: 0.47710490226745605 secondsTime to load utils op: 0.4770934581756592 seconds +29: +29: Time to load utils op: 0.47710561752319336 seconds + 5: Time to load utils op: 0.47803235054016113 seconds + 5: Time to load utils op: 0.4780597686767578 seconds + 5: Time to load utils op: 0.4780552387237549 secondsTime to load utils op: 0.47805094718933105 seconds + 5: + 5: Time to load utils op: 0.4780251979827881 seconds + 5: Time to load utils op: 0.4780604839324951 seconds + 5: Time to load utils op: 0.4781370162963867 seconds + 5: Time to load utils op: 0.47815632820129395 seconds +20: Time to load utils op: 0.49660563468933105 secondsTime to load utils op: 0.49651217460632324 secondsTime to load utils op: 0.4974071979522705 seconds +20: +20: +20: Time to load utils op: 0.49706292152404785 seconds +20: Time to load utils op: 0.49638938903808594 seconds +20: Time to load utils op: 0.49697375297546387 secondsTime to load utils op: 0.4956488609313965 seconds +20: +20: Time to load utils op: 0.4961550235748291 seconds + 8: Time to load utils op: 0.5113966464996338 secondsTime to load utils op: 0.5121603012084961 seconds + 8: + 8: Time to load utils op: 0.5118310451507568 seconds +16: Time to load utils op: 0.5026273727416992 seconds + 8: Time to load utils op: 0.5124025344848633 secondsTime to load utils op: 0.5118842124938965 seconds + 8: + 8: Time to load utils op: 0.5122296810150146 seconds + 8: Time to load utils op: 0.512253999710083 secondsTime to load utils op: 0.5122604370117188 seconds + 8: +16: Time to load utils op: 0.5020544528961182 seconds +16: Time to load utils op: 0.5012655258178711 seconds +16: Time to load utils op: 0.5018854141235352 seconds +16: Time to load utils op: 0.5017557144165039 secondsTime to load utils op: 0.5025818347930908 secondsTime to load utils op: 0.5025808811187744 seconds +16: +16: +16: Time to load utils op: 0.5025143623352051 seconds + 3: Time to load utils op: 0.48209524154663086 seconds + 3: Time to load utils op: 0.482166051864624 seconds + 3: Time to load utils op: 0.4822065830230713 seconds +10: Time to load utils op: 0.48174333572387695 seconds +10: Time to load utils op: 0.4817624092102051 seconds + 3: Time to load utils op: 0.48221659660339355 seconds +15: Time to load utils op: 0.48138880729675293 seconds +15: Time to load utils op: 0.48142218589782715 seconds +15: Time to load utils op: 0.48145103454589844 secondsTime to load utils op: 0.48143434524536133 seconds +15: + 3: Time to load utils op: 0.48229408264160156 seconds + 3: Time to load utils op: 0.4823117256164551 secondsTime to load utils op: 0.4823172092437744 seconds + 3: + 3: Time to load utils op: 0.48233890533447266 seconds +10: Time to load utils op: 0.4817948341369629 seconds +10: Time to load utils op: 0.48171186447143555 seconds +10: Time to load utils op: 0.4819035530090332 seconds +10: Time to load utils op: 0.48187780380249023 seconds +10: Time to load utils op: 0.4818916320800781 seconds +10: Time to load utils op: 0.48192906379699707 seconds +15: Time to load utils op: 0.4819958209991455 secondsTime to load utils op: 0.48200011253356934 secondsTime to load utils op: 0.48200297355651855 seconds +15: +15: +15: Time to load utils op: 0.48200368881225586 seconds +18: Time to load utils op: 0.5032079219818115 seconds +18: Time to load utils op: 0.503704309463501 seconds +18: Time to load utils op: 0.5024158954620361 seconds +18: Time to load utils op: 0.4996788501739502 secondsTime to load utils op: 0.5032501220703125 secondsTime to load utils op: 0.5025887489318848 seconds +18: +18: Time to load utils op: 0.5034165382385254 seconds +18: +18: Time to load utils op: 0.5020840167999268 seconds +11: Time to load utils op: 0.5114877223968506 seconds +11: Time to load utils op: 0.5112924575805664 seconds +11: Time to load utils op: 0.5100851058959961 seconds +11: Time to load utils op: 0.5113010406494141 seconds +11: Time to load utils op: 0.5113680362701416 seconds +11: Time to load utils op: 0.5114920139312744 secondsTime to load utils op: 0.511406421661377 seconds +11: +11: Time to load utils op: 0.5113718509674072 seconds +26: Time to load utils op: 0.4941556453704834 seconds +26: Time to load utils op: 0.4925839900970459 seconds +26: Time to load utils op: 0.49304986000061035 seconds +26: Time to load utils op: 0.49378252029418945 seconds +26: Time to load utils op: 0.4928884506225586 seconds +25: Time to load utils op: 0.48305845260620117 seconds +25: Time to load utils op: 0.4830617904663086 seconds +25: Time to load utils op: 0.48308420181274414 seconds +25: Time to load utils op: 0.48310065269470215 seconds +25: Time to load utils op: 0.4831855297088623 secondsTime to load utils op: 0.4832003116607666 secondsTime to load utils op: 0.4831974506378174 seconds +25: +25: +25: Time to load utils op: 0.48320984840393066 seconds +26: Time to load utils op: 0.4938974380493164 seconds +26: Time to load utils op: 0.49428653717041016 secondsTime to load utils op: 0.4928774833679199 seconds +26: +31: Time to load utils op: 0.4870750904083252 secondsTime to load utils op: 0.4879155158996582 seconds +31: +31: Time to load utils op: 0.48827075958251953 seconds +31: Time to load utils op: 0.4883697032928467 seconds +31: Time to load utils op: 0.4882771968841553 seconds +31: Time to load utils op: 0.48792171478271484 seconds +31: Time to load utils op: 0.48676609992980957 secondsTime to load utils op: 0.4876132011413574 seconds +31: + 4: Time to load utils op: 0.5222346782684326 seconds + 4: Time to load utils op: 0.5214142799377441 seconds + 4: Time to load utils op: 0.522294282913208 seconds + 4: Time to load utils op: 0.5227818489074707 secondsTime to load utils op: 0.5218348503112793 secondsTime to load utils op: 0.521085262298584 seconds + 4: + 4: + 4: Time to load utils op: 0.5225231647491455 seconds + 4: Time to load utils op: 0.5225839614868164 seconds +27: Time to load utils op: 0.4840261936187744 secondsTime to load utils op: 0.48403501510620117 secondsTime to load utils op: 0.4839296340942383 seconds +27: +27: +27: Time to load utils op: 0.48404598236083984 seconds +27: Time to load utils op: 0.48403048515319824 secondsTime to load utils op: 0.48404765129089355 seconds +27: +27: Time to load utils op: 0.48409509658813477 secondsTime to load utils op: 0.48409390449523926 seconds +27: +21: Time to load utils op: 0.4845752716064453 secondsTime to load utils op: 0.48456239700317383 secondsTime to load utils op: 0.48457765579223633 secondsTime to load utils op: 0.48457908630371094 seconds +21: +21: +21: +21: Time to load utils op: 0.484586238861084 seconds +21: Time to load utils op: 0.48459649085998535 secondsTime to load utils op: 0.4846038818359375 seconds +21: Time to load utils op: 0.4846048355102539 seconds +21: +23: Time to load utils op: 0.4984591007232666 secondsTime to load utils op: 0.49843573570251465 seconds +23: + 9: Time to load utils op: 0.5168190002441406 secondsTime to load utils op: 0.5180325508117676 seconds + 9: + 9: Time to load utils op: 0.5167841911315918 secondsTime to load utils op: 0.5177152156829834 seconds +23: Time to load utils op: 0.49897146224975586 seconds +23: Time to load utils op: 0.49927186965942383 seconds +23: Time to load utils op: 0.4984755516052246 secondsTime to load utils op: 0.49768924713134766 seconds +23: +23: Time to load utils op: 0.4985523223876953 seconds +23: Time to load utils op: 0.49851417541503906 seconds + 0: Time to load utils op: 0.5279088020324707 secondsTime to load utils op: 0.4832334518432617 seconds + 0: + 0: Time to load utils op: 0.5267019271850586 seconds + 9: Time to load utils op: 0.5167181491851807 seconds + 9: + 0: Time to load utils op: 0.5270838737487793 seconds + 0: Time to load utils op: 0.5275921821594238 seconds + 9: Time to load utils op: 0.5172631740570068 seconds + 9: Time to load utils op: 0.5170395374298096 seconds + 0: Time to load utils op: 0.528010368347168 seconds + 0: Time to load utils op: 0.5270571708679199 seconds + 9: Time to load utils op: 0.5180461406707764 seconds + 0: Time to load utils op: 0.5274350643157959 seconds +24: Time to load utils op: 0.4987483024597168 seconds +24: Time to load utils op: 0.49871301651000977 seconds +24: Time to load utils op: 0.4996359348297119 seconds +24: Time to load utils op: 0.4997878074645996 seconds +24: Time to load utils op: 0.4984092712402344 seconds +24: Time to load utils op: 0.498854398727417 secondsTime to load utils op: 0.49915027618408203 seconds +24: Time to load utils op: 0.4983694553375244 seconds +24: +28: Time to load utils op: 0.4935004711151123 seconds +28: Time to load utils op: 0.4933907985687256 seconds +28: Time to load utils op: 0.49326610565185547 seconds +28: Time to load utils op: 0.4934074878692627 seconds +28: Time to load utils op: 0.4930586814880371 secondsTime to load utils op: 0.49338221549987793 seconds +28: Time to load utils op: 0.49341535568237305 seconds +28: Time to load utils op: 0.4929969310760498 seconds +28: +22: Time to load utils op: 0.4864346981048584 seconds +22: Time to load utils op: 0.4864504337310791 seconds +22: Time to load utils op: 0.48645853996276855 seconds +22: Time to load utils op: 0.486494779586792 secondsTime to load utils op: 0.4864490032196045 seconds +22: +22: Time to load utils op: 0.48649120330810547 secondsTime to load utils op: 0.4864630699157715 seconds +22: +22: Time to load utils op: 0.4864974021911621 seconds +17: Time to load utils op: 0.48670291900634766 seconds +17: Time to load utils op: 0.48668551445007324 seconds +17: Time to load utils op: 0.48670291900634766 seconds +17: Time to load utils op: 0.48671603202819824 seconds +17: Time to load utils op: 0.4867560863494873 seconds +17: Time to load utils op: 0.4866366386413574 secondsTime to load utils op: 0.4867558479309082 seconds +17: +17: Time to load utils op: 0.48676490783691406 seconds + 1: Time to load utils op: 0.4874730110168457 seconds +19: Time to load utils op: 0.5065085887908936 seconds +19: Time to load utils op: 0.5072846412658691 seconds +19: Time to load utils op: 0.5074098110198975 seconds + 1: Time to load utils op: 0.4876515865325928 seconds + 1: Time to load utils op: 0.4876730442047119 seconds + 1: Time to load utils op: 0.4876720905303955 secondsTime to load utils op: 0.48767614364624023 seconds + 1: + 1: Time to load utils op: 0.4876844882965088 seconds +19: Time to load utils op: 0.5071735382080078 seconds +19: Time to load utils op: 0.5069670677185059 secondsTime to load utils op: 0.5078845024108887 seconds +19: +19: Time to load utils op: 0.5071995258331299 seconds + 1: Time to load utils op: 0.48769593238830566 seconds +19: Time to load utils op: 0.5066444873809814 seconds + 1: Time to load utils op: 0.48770928382873535 seconds +13: Time to load utils op: 0.4875984191894531 seconds +13: Time to load utils op: 0.4876072406768799 seconds +13: Time to load utils op: 0.4876065254211426 seconds +13: Time to load utils op: 0.48755621910095215 seconds +13: Time to load utils op: 0.48768162727355957 secondsTime to load utils op: 0.4876837730407715 seconds +13: +13: Time to load utils op: 0.48766541481018066 seconds +13: Time to load utils op: 0.4876978397369385 seconds +14: Time to load utils op: 0.48810839653015137 seconds +14: Time to load utils op: 0.48813939094543457 seconds +14: Time to load utils op: 0.48817014694213867 seconds +14: Time to load utils op: 0.4881908893585205 seconds +14: Time to load utils op: 0.48816537857055664 secondsTime to load utils op: 0.48819828033447266 seconds +14: +14: Time to load utils op: 0.4882223606109619 seconds +14: Time to load utils op: 0.4882369041442871 seconds + 0: [2023-05-13 03:28:18,406] [INFO] [utils.py:827:see_memory_usage] before initializing group 0 + 0: [2023-05-13 03:28:18,407] [INFO] [utils.py:828:see_memory_usage] MA 5.25 GB Max_MA 5.25 GB CA 5.32 GB Max_CA 5 GB + 0: [2023-05-13 03:28:18,407] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.49 GB, percent = 8.2% +30: Time to load utils op: 0.0008175373077392578 seconds +30: Time to load utils op: 0.0008172988891601562 seconds + 6: Time to load utils op: 0.0009222030639648438 seconds +30: Time to load utils op: 0.0013699531555175781 seconds +30: Time to load utils op: 0.0013201236724853516 seconds +30: Time to load utils op: 0.0013499259948730469 seconds +30: Time to load utils op: 0.001310586929321289 secondsTime to load utils op: 0.0013375282287597656 seconds +30: +30: Time to load utils op: 0.001461029052734375 seconds + 6: Time to load utils op: 0.001397848129272461 seconds + 6: Time to load utils op: 0.0013921260833740234 seconds + 6: Time to load utils op: 0.001291513442993164 secondsTime to load utils op: 0.0012803077697753906 seconds + 6: + 6: Time to load utils op: 0.0013322830200195312 seconds + 6: Time to load utils op: 0.0013074874877929688 seconds + 6: Time to load utils op: 0.0013217926025390625 seconds +31: Time to load utils op: 0.0007855892181396484 seconds +31: Time to load utils op: 0.0009267330169677734 seconds +31: Time to load utils op: 0.0008258819580078125 seconds +31: Time to load utils op: 0.0012264251708984375 seconds +31: Time to load utils op: 0.0012307167053222656 seconds +31: Time to load utils op: 0.0012073516845703125 secondsTime to load utils op: 0.0012297630310058594 seconds +31: +31: Time to load utils op: 0.0013473033905029297 seconds + 0: Time to load utils op: 0.0005159378051757812 seconds + 9: Time to load utils op: 0.0008883476257324219 seconds +18: Time to load utils op: 0.0004925727844238281 seconds + 0: Time to load utils op: 0.00047326087951660156 seconds +28: Time to load utils op: 0.0007674694061279297 seconds + 0: Time to load utils op: 0.00040984153747558594 seconds +28: Time to load utils op: 0.0009365081787109375 seconds +28: Time to load utils op: 0.0008385181427001953 seconds + 0: Time to load utils op: 0.00041222572326660156 seconds +18: Time to load utils op: 0.0004494190216064453 secondsTime to load utils op: 0.0004730224609375 seconds +18: +28: Time to load utils op: 0.0009531974792480469 seconds +18: Time to load utils op: 0.00048351287841796875 seconds +18: Time to load utils op: 0.0004913806915283203 secondsTime to load utils op: 0.0004932880401611328 secondsTime to load utils op: 0.0004980564117431641 seconds +18: +18: +18: Time to load utils op: 0.0005860328674316406 seconds + 0: Time to load utils op: 0.00041866302490234375 seconds + 9: Time to load utils op: 0.0012860298156738281 seconds +26: Time to load utils op: 0.0005445480346679688 seconds + 0: Time to load utils op: 0.0004622936248779297 seconds +26: Time to load utils op: 0.0005424022674560547 seconds +28: Time to load utils op: 0.00101470947265625 seconds + 9: Time to load utils op: 0.0012803077697753906 seconds + 9: Time to load utils op: 0.0013318061828613281 secondsTime to load utils op: 0.0012989044189453125 seconds + 9: +26: Time to load utils op: 0.0005390644073486328 seconds + 9: Time to load utils op: 0.0012845993041992188 seconds + 9: Time to load utils op: 0.0012564659118652344 seconds +28: Time to load utils op: 0.0012004375457763672 secondsTime to load utils op: 0.0011932849884033203 seconds +28: +26: Time to load utils op: 0.0005598068237304688 seconds + 9: Time to load utils op: 0.0013210773468017578 seconds +26: Time to load utils op: 0.0005772113800048828 seconds +19: Time to load utils op: 0.0008242130279541016 seconds +28: Time to load utils op: 0.0012552738189697266 seconds +26: Time to load utils op: 0.0006518363952636719 seconds +26: Time to load utils op: 0.0006325244903564453 seconds +26: Time to load utils op: 0.0006215572357177734 seconds +19: Time to load utils op: 0.0011172294616699219 seconds + 0: Time to load utils op: 0.0007083415985107422 seconds +19: Time to load utils op: 0.0011897087097167969 secondsTime to load utils op: 0.0011725425720214844 seconds +19: +19: Time to load utils op: 0.0012230873107910156 seconds +19: Time to load utils op: 0.0013611316680908203 secondsTime to load utils op: 0.0013508796691894531 seconds +19: +19: Time to load utils op: 0.0014355182647705078 seconds +23: Time to load utils op: 0.0004856586456298828 seconds +23: Time to load utils op: 0.00047016143798828125 seconds +23: Time to load utils op: 0.00042629241943359375 secondsTime to load utils op: 0.0004801750183105469 seconds +23: Time to load utils op: 0.00047326087951660156 seconds +23: Time to load utils op: 0.00046944618225097656 seconds +23: Time to load utils op: 0.0004723072052001953 seconds +23: +23: Time to load utils op: 0.0005123615264892578 seconds + 8: Time to load utils op: 0.0006897449493408203 seconds + 8: Time to load utils op: 0.0006585121154785156 seconds + 2: Time to load utils op: 0.0008804798126220703 seconds + 8: Time to load utils op: 0.0008308887481689453 secondsTime to load utils op: 0.0008244514465332031 seconds + 8: + 8: Time to load utils op: 0.0009875297546386719 seconds + 8: Time to load utils op: 0.0010483264923095703 secondsTime to load utils op: 0.000997304916381836 seconds + 8: +24: Time to load utils op: 0.0007841587066650391 seconds + 8: Time to load utils op: 0.0011830329895019531 seconds +24: Time to load utils op: 0.0008680820465087891 seconds +24: Time to load utils op: 0.0010371208190917969 seconds +24: Time to load utils op: 0.0009140968322753906 seconds +24: Time to load utils op: 0.0010275840759277344 seconds + 2: Time to load utils op: 0.0013997554779052734 secondsTime to load utils op: 0.0013687610626220703 seconds + 2: + 2: Time to load utils op: 0.0014834403991699219 seconds + 2: Time to load utils op: 0.0013647079467773438 seconds + 2: Time to load utils op: 0.0014438629150390625 secondsTime to load utils op: 0.0014150142669677734 seconds + 2: +24: Time to load utils op: 0.0012850761413574219 seconds +24: Time to load utils op: 0.0012235641479492188 seconds + 2: Time to load utils op: 0.0014789104461669922 seconds +24: Time to load utils op: 0.001317739486694336 seconds + 4: Time to load utils op: 0.0007197856903076172 seconds + 4: Time to load utils op: 0.0010175704956054688 seconds + 4: Time to load utils op: 0.0012054443359375 seconds + 4: Time to load utils op: 0.0012981891632080078 seconds + 4: Time to load utils op: 0.0012631416320800781 seconds + 4: Time to load utils op: 0.0013427734375 secondsTime to load utils op: 0.0012824535369873047 seconds + 4: + 4: Time to load utils op: 0.0013270378112792969 seconds + 5: Time to load utils op: 0.0014705657958984375 seconds +11: Time to load utils op: 0.0005517005920410156 seconds +12: Time to load utils op: 0.0006613731384277344 seconds + 1: Time to load utils op: 0.0010159015655517578 seconds +12: Time to load utils op: 0.0005955696105957031 seconds +20: Time to load utils op: 0.0009202957153320312 seconds +20: Time to load utils op: 0.0007810592651367188 seconds +20: Time to load utils op: 0.0008618831634521484 seconds +20: Time to load utils op: 0.0008318424224853516 seconds +20: Time to load utils op: 0.0009615421295166016 seconds +20: Time to load utils op: 0.0008842945098876953 secondsTime to load utils op: 0.0008604526519775391 seconds +20: +20: Time to load utils op: 0.0008902549743652344 seconds +25: Time to load utils op: 0.0008425712585449219 seconds +10: Time to load utils op: 0.001169443130493164 seconds +13: Time to load utils op: 0.0012252330780029297 seconds +14: Time to load utils op: 0.0013897418975830078 seconds +10: Time to load utils op: 0.0012829303741455078 seconds +14: Time to load utils op: 0.0014653205871582031 seconds +14: Time to load utils op: 0.0015196800231933594 seconds +22: Time to load utils op: 0.0012285709381103516 seconds +25: Time to load utils op: 0.0013260841369628906 seconds +16: Time to load utils op: 0.0014014244079589844 seconds +22: Time to load utils op: 0.0014095306396484375 seconds +29: Time to load utils op: 0.0022759437561035156 seconds + 5: Time to load utils op: 0.003188610076904297 seconds +17: Time to load utils op: 0.001645803451538086 seconds +21: Time to load utils op: 0.0016891956329345703 seconds + 5: Time to load utils op: 0.0031583309173583984 seconds + 5: Time to load utils op: 0.003195047378540039 secondsTime to load utils op: 0.0032453536987304688 seconds + 5: +13: Time to load utils op: 0.002002239227294922 seconds + 5: Time to load utils op: 0.0032477378845214844 seconds + 5: Time to load utils op: 0.0032846927642822266 secondsTime to load utils op: 0.003262042999267578 seconds + 5: +12: Time to load utils op: 0.0019369125366210938 seconds + 1: Time to load utils op: 0.0025169849395751953 seconds +12: Time to load utils op: 0.0019614696502685547 seconds + 1: Time to load utils op: 0.0024814605712890625 seconds +13: Time to load utils op: 0.0022215843200683594 seconds +29: Time to load utils op: 0.0024483203887939453 seconds + 1: Time to load utils op: 0.0025556087493896484 seconds +27: Time to load utils op: 0.0020062923431396484 seconds +27: Time to load utils op: 0.0019369125366210938 seconds +29: Time to load utils op: 0.002479076385498047 seconds +10: Time to load utils op: 0.0021622180938720703 seconds + 1: Time to load utils op: 0.002498626708984375 seconds +25: Time to load utils op: 0.0019593238830566406 seconds + 1: Time to load utils op: 0.0025000572204589844 seconds +12: Time to load utils op: 0.0019927024841308594 seconds +12: Time to load utils op: 0.001909494400024414 seconds +13: Time to load utils op: 0.0023250579833984375 seconds +12: Time to load utils op: 0.0019958019256591797 seconds +16: Time to load utils op: 0.002103567123413086 seconds +29: Time to load utils op: 0.0025167465209960938 seconds + 1: Time to load utils op: 0.002485990524291992 seconds +11: Time to load utils op: 0.0024220943450927734 secondsTime to load utils op: 0.002541065216064453 seconds +11: +21: Time to load utils op: 0.0021653175354003906 seconds +12: Time to load utils op: 0.001989126205444336 seconds +29: Time to load utils op: 0.002571582794189453 seconds +10: Time to load utils op: 0.0023429393768310547 seconds +10: Time to load utils op: 0.0021753311157226562 seconds +13: Time to load utils op: 0.002560853958129883 seconds +13: Time to load utils op: 0.0024373531341552734 seconds +13: Time to load utils op: 0.002399444580078125 seconds +29: Time to load utils op: 0.0025408267974853516 seconds + 1: Time to load utils op: 0.002567768096923828 seconds +14: Time to load utils op: 0.002283811569213867 seconds +14: Time to load utils op: 0.0023088455200195312 seconds +29: Time to load utils op: 0.002553224563598633 seconds +10: Time to load utils op: 0.002233266830444336 seconds +10: Time to load utils op: 0.002182483673095703 seconds +11: Time to load utils op: 0.0025599002838134766 seconds +11: Time to load utils op: 0.0025293827056884766 seconds +11: Time to load utils op: 0.0024869441986083984 seconds +14: Time to load utils op: 0.0023407936096191406 secondsTime to load utils op: 0.0023949146270751953 seconds +14: +14: Time to load utils op: 0.002332925796508789 seconds +13: Time to load utils op: 0.0025947093963623047 seconds +25: Time to load utils op: 0.0021305084228515625 seconds +29: Time to load utils op: 0.0026602745056152344 seconds +11: Time to load utils op: 0.002471923828125 seconds +17: Time to load utils op: 0.0023040771484375 seconds +22: Time to load utils op: 0.0024123191833496094 seconds +10: Time to load utils op: 0.002161741256713867 seconds +11: Time to load utils op: 0.0025758743286132812 seconds +17: Time to load utils op: 0.002374410629272461 seconds +22: Time to load utils op: 0.002401113510131836 seconds +25: Time to load utils op: 0.002192974090576172 seconds +25: Time to load utils op: 0.002153635025024414 secondsTime to load utils op: 0.002115011215209961 seconds +25: +16: Time to load utils op: 0.0024950504302978516 secondsTime to load utils op: 0.002496004104614258 seconds +16: +16: Time to load utils op: 0.002490520477294922 seconds +16: Time to load utils op: 0.0025315284729003906 seconds +16: Time to load utils op: 0.002424478530883789 seconds +22: Time to load utils op: 0.002372264862060547 seconds +25: Time to load utils op: 0.002250194549560547 seconds +27: Time to load utils op: 0.002272367477416992 seconds +17: Time to load utils op: 0.0022525787353515625 seconds +17: Time to load utils op: 0.002322673797607422 seconds +27: Time to load utils op: 0.0023910999298095703 seconds +17: Time to load utils op: 0.002303600311279297 seconds +21: Time to load utils op: 0.002652883529663086 seconds +21: Time to load utils op: 0.002610445022583008 seconds +16: Time to load utils op: 0.0024678707122802734 seconds +22: Time to load utils op: 0.002345561981201172 seconds +22: Time to load utils op: 0.002290487289428711 seconds +27: Time to load utils op: 0.002371549606323242 seconds +27: Time to load utils op: 0.0023071765899658203 secondsTime to load utils op: 0.0023505687713623047 seconds +27: +27: Time to load utils op: 0.002298116683959961 seconds +17: Time to load utils op: 0.0023953914642333984 seconds +21: Time to load utils op: 0.0026559829711914062 seconds +22: Time to load utils op: 0.0023555755615234375 seconds +17: Time to load utils op: 0.0024068355560302734 seconds +21: Time to load utils op: 0.0026230812072753906 seconds +21: Time to load utils op: 0.002618074417114258 seconds +21: Time to load utils op: 0.002676725387573242 seconds + 0: [2023-05-13 03:28:18,539] [INFO] [utils.py:827:see_memory_usage] after initializing group 0 + 0: [2023-05-13 03:28:18,540] [INFO] [utils.py:828:see_memory_usage] MA 10.64 GB Max_MA 10.64 GB CA 13.39 GB Max_CA 13 GB + 0: [2023-05-13 03:28:18,540] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% +15: Time to load utils op: 0.0009708404541015625 seconds +15: Time to load utils op: 0.0011031627655029297 seconds +15: Time to load utils op: 0.001238107681274414 seconds +15: Time to load utils op: 0.0014445781707763672 seconds +15: Time to load utils op: 0.0015120506286621094 seconds +15: Time to load utils op: 0.001528024673461914 seconds +15: Time to load utils op: 0.0015265941619873047 seconds +15: Time to load utils op: 0.0016226768493652344 seconds + 7: Time to load utils op: 0.0010247230529785156 seconds + 7: Time to load utils op: 0.0014498233795166016 seconds + 7: Time to load utils op: 0.0014464855194091797 secondsTime to load utils op: 0.0014424324035644531 seconds + 7: + 7: Time to load utils op: 0.0014545917510986328 secondsTime to load utils op: 0.0014231204986572266 seconds + 7: + 7: Time to load utils op: 0.0014367103576660156 seconds + 7: Time to load utils op: 0.0014348030090332031 seconds + 3: Time to load utils op: 0.0009450912475585938 seconds + 3: Time to load utils op: 0.0008678436279296875 seconds + 3: Time to load utils op: 0.0008912086486816406 seconds + 3: Time to load utils op: 0.0007946491241455078 seconds + 3: Time to load utils op: 0.0009162425994873047 seconds + 3: Time to load utils op: 0.0009312629699707031 seconds + 3: Time to load utils op: 0.0011191368103027344 seconds + 3: Time to load utils op: 0.0009596347808837891 seconds + 0: [2023-05-13 03:28:18,645] [INFO] [utils.py:827:see_memory_usage] before initializing group 1 + 0: [2023-05-13 03:28:18,646] [INFO] [utils.py:828:see_memory_usage] MA 10.64 GB Max_MA 10.64 GB CA 13.39 GB Max_CA 13 GB + 0: [2023-05-13 03:28:18,646] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% + 0: [2023-05-13 03:28:18,750] [INFO] [utils.py:827:see_memory_usage] after initializing group 1 + 0: [2023-05-13 03:28:18,751] [INFO] [utils.py:828:see_memory_usage] MA 15.73 GB Max_MA 15.73 GB CA 21.01 GB Max_CA 21 GB + 0: [2023-05-13 03:28:18,751] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% + 0: [2023-05-13 03:28:18,852] [INFO] [utils.py:827:see_memory_usage] before initializing group 2 + 0: [2023-05-13 03:28:18,853] [INFO] [utils.py:828:see_memory_usage] MA 15.73 GB Max_MA 15.73 GB CA 21.01 GB Max_CA 21 GB + 0: [2023-05-13 03:28:18,853] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% + 0: [2023-05-13 03:28:18,961] [INFO] [utils.py:827:see_memory_usage] after initializing group 2 + 0: [2023-05-13 03:28:18,961] [INFO] [utils.py:828:see_memory_usage] MA 15.74 GB Max_MA 15.74 GB CA 21.01 GB Max_CA 21 GB + 0: [2023-05-13 03:28:18,962] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% + 0: [2023-05-13 03:28:19,064] [INFO] [utils.py:827:see_memory_usage] before initialize_optimizer + 0: [2023-05-13 03:28:19,064] [INFO] [utils.py:828:see_memory_usage] MA 15.74 GB Max_MA 15.74 GB CA 21.01 GB Max_CA 21 GB + 0: [2023-05-13 03:28:19,065] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% + 0: [2023-05-13 03:28:19,173] [INFO] [utils.py:827:see_memory_usage] end initialize_optimizer + 0: [2023-05-13 03:28:19,173] [INFO] [utils.py:828:see_memory_usage] MA 15.82 GB Max_MA 15.82 GB CA 21.01 GB Max_CA 21 GB + 0: [2023-05-13 03:28:19,174] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% + 0: [2023-05-13 03:28:19,277] [INFO] [utils.py:827:see_memory_usage] end bf16_optimizer + 0: [2023-05-13 03:28:19,278] [INFO] [utils.py:828:see_memory_usage] MA 15.82 GB Max_MA 15.82 GB CA 21.01 GB Max_CA 21 GB + 0: [2023-05-13 03:28:19,278] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 41.64 GB, percent = 8.3% + 0: [2023-05-13 03:28:19,278] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Final Optimizer = FusedAdam + 0: [2023-05-13 03:28:19,278] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed using client LR scheduler + 0: [2023-05-13 03:28:19,278] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed LR Scheduler = + 0: [2023-05-13 03:28:19,278] [INFO] [logging.py:68:log_dist] [Rank 0] step=0, skipped=0, lr=[0.0002, 0.0002, 0.0002], mom=[(0.9, 0.999), (0.9, 0.999), (0.9, 0.999)] + 0: [2023-05-13 03:28:19,279] [INFO] [config.py:1007:print] DeepSpeedEngine configuration: + 0: [2023-05-13 03:28:19,279] [INFO] [config.py:1011:print] activation_checkpointing_config { + 0: "partition_activations": false, + 0: "contiguous_memory_optimization": false, + 0: "cpu_checkpointing": false, + 0: "number_checkpoints": null, + 0: "synchronize_checkpoint_boundary": false, + 0: "profile": false + 0: } + 0: [2023-05-13 03:28:19,279] [INFO] [config.py:1011:print] aio_config ................... {'block_size': 1048576, 'queue_depth': 8, 'thread_count': 1, 'single_submit': False, 'overlap_events': True} + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] amp_enabled .................. False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] amp_params ................... False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] autotuning_config ............ { + 0: "enabled": false, + 0: "start_step": null, + 0: "end_step": null, + 0: "metric_path": null, + 0: "arg_mappings": null, + 0: "metric": "throughput", + 0: "model_info": null, + 0: "results_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_results", + 0: "exps_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_exps", + 0: "overwrite": true, + 0: "fast": true, + 0: "start_profile_step": 3, + 0: "end_profile_step": 5, + 0: "tuner_type": "gridsearch", + 0: "tuner_early_stopping": 5, + 0: "tuner_num_trials": 50, + 0: "model_info_path": null, + 0: "mp_size": 1, + 0: "max_train_batch_size": null, + 0: "min_train_batch_size": 1, + 0: "max_train_micro_batch_size_per_gpu": 1.024000e+03, + 0: "min_train_micro_batch_size_per_gpu": 1, + 0: "num_tuning_micro_batch_sizes": 3 + 0: } + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] bfloat16_enabled ............. True + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] checkpoint_parallel_write_pipeline False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] checkpoint_tag_validation_enabled True + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] checkpoint_tag_validation_fail False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] comms_config ................. + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] communication_data_type ...... None + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] compression_config ........... {'weight_quantization': {'shared_parameters': {'enabled': False, 'quantizer_kernel': False, 'schedule_offset': 0, 'quantize_groups': 1, 'quantize_verbose': False, 'quantization_type': 'symmetric', 'quantize_weight_in_forward': False, 'rounding': 'nearest', 'fp16_mixed_quantize': False, 'quantize_change_ratio': 0.001}, 'different_groups': {}}, 'activation_quantization': {'shared_parameters': {'enabled': False, 'quantization_type': 'symmetric', 'range_calibration': 'dynamic', 'schedule_offset': 1000}, 'different_groups': {}}, 'sparse_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'row_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'head_pruning': {'shared_parameters': {'enabled': False, 'method': 'topk', 'schedule_offset': 1000}, 'different_groups': {}}, 'channel_pruning': {'shared_pa + 0: rameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'layer_reduction': {'enabled': False}} + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] curriculum_enabled ........... False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] curriculum_params ............ False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] dataloader_drop_last ......... False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] disable_allgather ............ False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] dump_state ................... False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] dynamic_loss_scale_args ...... None + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] eigenvalue_enabled ........... False + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] eigenvalue_gas_boundary_resolution 1 + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] eigenvalue_layer_name ........ bert.encoder.layer + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] eigenvalue_layer_num ......... 0 + 0: [2023-05-13 03:28:19,280] [INFO] [config.py:1011:print] eigenvalue_max_iter .......... 100 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] eigenvalue_stability ......... 1e-06 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] eigenvalue_tol ............... 0.01 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] eigenvalue_verbose ........... False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] elasticity_enabled ........... False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] flops_profiler_config ........ { + 0: "enabled": false, + 0: "profile_step": 1, + 0: "module_depth": -1, + 0: "top_modules": 1, + 0: "detailed": true, + 0: "output_file": null + 0: } + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] fp16_auto_cast ............... None + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] fp16_enabled ................. False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] fp16_master_weights_and_gradients False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] global_rank .................. 0 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] gradient_accumulation_steps .. 1 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] gradient_clipping ............ 1.0 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] gradient_predivide_factor .... 1.0 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] initial_dynamic_scale ........ 1 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] load_universal_checkpoint .... False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] loss_scale ................... 1.0 + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] memory_breakdown ............. False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] monitor_config ............... + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] nebula_config ................ { + 0: "enabled": false, + 0: "persistent_storage_path": null, + 0: "persistent_time_interval": 100, + 0: "num_of_version_in_retention": 2, + 0: "enable_nebula_load": true, + 0: "load_path": null + 0: } + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] optimizer_legacy_fusion ...... False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] optimizer_name ............... None + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] optimizer_params ............. None + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] pipeline ..................... {'stages': 'auto', 'partition': 'best', 'seed_layers': False, 'activation_checkpoint_interval': 0} + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] pld_enabled .................. False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] pld_params ................... False + 0: [2023-05-13 03:28:19,281] [INFO] [config.py:1011:print] prescale_gradients ........... False + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] scheduler_name ............... None + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] scheduler_params ............. None + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] sparse_attention ............. None + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] sparse_gradients_enabled ..... False + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] steps_per_print .............. 2000 + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] train_batch_size ............. 512 + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] train_micro_batch_size_per_gpu 2 + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] use_node_local_storage ....... False + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] wall_clock_breakdown ......... False + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] world_size ................... 256 + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] zero_allow_untested_optimizer False + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] zero_config .................. stage=0 contiguous_gradients=True reduce_scatter=True reduce_bucket_size=500000000 allgather_partitions=True allgather_bucket_size=500000000 overlap_comm=False load_from_fp32_weights=True elastic_checkpoint=False offload_param=None offload_optimizer=None sub_group_size=1000000000 cpu_offload_param=None cpu_offload_use_pin_memory=None cpu_offload=None prefetch_bucket_size=50000000 param_persistence_threshold=100000 model_persistence_threshold=9223372036854775807 max_live_parameters=1000000000 max_reuse_distance=1000000000 gather_16bit_weights_on_model_save=False stage3_gather_fp16_weights_on_model_save=False ignore_unused_parameters=True legacy_stage1=False round_robin_gradients=False + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] zero_enabled ................. False + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:1011:print] zero_optimization_stage ...... 0 + 0: [2023-05-13 03:28:19,282] [INFO] [config.py:996:print_user_config] json = { + 0: "train_micro_batch_size_per_gpu": 2, + 0: "train_batch_size": 512, + 0: "gradient_clipping": 1.0, + 0: "zero_optimization": { + 0: "stage": 0 + 0: }, + 0: "bf16": { + 0: "enabled": true + 0: }, + 0: "steps_per_print": 2.000000e+03, + 0: "wall_clock_breakdown": false + 0: } + 0: Time to load utils op: 0.00043892860412597656 seconds + 0: [2023-05-13 03:28:19,283] [INFO] [engine.py:87:__init__] CONFIG: micro_batches=1 micro_batch_size=2 + 0: [2023-05-13 03:28:19,358] [INFO] [engine.py:145:__init__] RANK=0 STAGE=0 LAYERS=41 [0, 41) STAGE_PARAMS=2809026560 (2809.027M) TOTAL_PARAMS=2809026560 (2809.027M) UNIQUE_PARAMS=2809026560 (2809.027M) +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:19,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 4: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +18: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:19,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +28: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 6: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +18: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 5: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +15: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +26: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +29: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +24: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +17: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +12: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +15: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +10: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 3: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +13: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +13: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +21: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +20: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +24: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 9: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +16: [2023-05-13 03:28:19,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +25: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +25: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +30: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt... +27: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 0: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 1: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 9: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +21: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +17: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +30: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. + 7: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +11: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +16: [2023-05-13 03:28:19,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/mp_rank_00_model_states.pt. +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:19,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:19,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:19,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:19,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:20,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +24: [2023-05-13 03:28:20,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:20,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:20,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +25: [2023-05-13 03:28:20,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:20,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:20,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +23: [2023-05-13 03:28:20,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +23: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:20,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:20,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:20,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:20,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:20,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:20,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +29: [2023-05-13 03:28:20,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +15: [2023-05-13 03:28:20,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:20,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:20,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +12: [2023-05-13 03:28:20,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +20: [2023-05-13 03:28:20,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +24: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +29: [2023-05-13 03:28:20,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +15: [2023-05-13 03:28:20,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +31: [2023-05-13 03:28:20,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +28: [2023-05-13 03:28:20,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +21: [2023-05-13 03:28:20,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +14: [2023-05-13 03:28:20,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:20,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:20,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:20,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +25: [2023-05-13 03:28:20,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +26: [2023-05-13 03:28:20,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +26: [2023-05-13 03:28:20,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +20: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +17: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +10: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +11: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +19: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +13: [2023-05-13 03:28:20,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:20,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:20,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:20,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:20,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:20,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:20,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:20,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +16: [2023-05-13 03:28:20,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:20,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +22: [2023-05-13 03:28:20,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +21: [2023-05-13 03:28:20,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:20,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +27: [2023-05-13 03:28:20,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +10: [2023-05-13 03:28:20,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +30: [2023-05-13 03:28:20,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +18: [2023-05-13 03:28:20,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt... +14: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +11: [2023-05-13 03:28:20,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +18: [2023-05-13 03:28:20,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +19: [2023-05-13 03:28:20,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +30: [2023-05-13 03:28:20,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +28: [2023-05-13 03:28:20,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +13: [2023-05-13 03:28:20,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +12: [2023-05-13 03:28:20,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +17: [2023-05-13 03:28:20,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +22: [2023-05-13 03:28:20,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +31: [2023-05-13 03:28:20,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +27: [2023-05-13 03:28:20,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_01-model_00-model_states.pt. +16: [2023-05-13 03:28:20,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +26: [2023-05-13 03:28:20,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:20,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +10: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:20,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:20,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:20,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +26: [2023-05-13 03:28:20,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:20,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:20,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:20,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 4: [2023-05-13 03:28:20,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:20,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 4: [2023-05-13 03:28:20,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:20,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:20,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 7: [2023-05-13 03:28:20,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:20,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:20,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:20,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +23: [2023-05-13 03:28:20,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +10: [2023-05-13 03:28:20,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:20,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +21: [2023-05-13 03:28:20,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:20,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:20,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +23: [2023-05-13 03:28:20,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:20,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:20,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:20,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:20,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:20,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:20,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:20,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:20,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:20,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:20,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:20,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +21: [2023-05-13 03:28:20,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:20,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:20,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:20,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:20,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:20,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +24: [2023-05-13 03:28:20,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:20,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +24: [2023-05-13 03:28:20,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:20,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +15: [2023-05-13 03:28:20,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +11: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +11: [2023-05-13 03:28:20,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:20,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:20,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:20,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:20,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +15: [2023-05-13 03:28:20,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:20,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:20,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 9: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:20,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +28: [2023-05-13 03:28:20,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:20,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:20,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:20,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:20,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:20,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:20,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:20,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:20,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 1: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +13: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 5: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +12: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 5: [2023-05-13 03:28:20,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:20,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +25: [2023-05-13 03:28:20,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +27: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +18: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:20,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +16: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +19: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:20,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +16: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 2: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 8: [2023-05-13 03:28:20,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +18: [2023-05-13 03:28:20,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:20,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +30: [2023-05-13 03:28:20,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 6: [2023-05-13 03:28:20,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:20,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:20,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:20,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 0: [2023-05-13 03:28:20,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +14: [2023-05-13 03:28:20,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +29: [2023-05-13 03:28:20,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 3: [2023-05-13 03:28:20,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +30: [2023-05-13 03:28:20,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:20,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:20,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +22: [2023-05-13 03:28:20,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +20: [2023-05-13 03:28:20,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:20,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:20,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:20,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:20,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:20,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +20: [2023-05-13 03:28:20,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:20,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +31: [2023-05-13 03:28:20,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +13: [2023-05-13 03:28:20,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:20,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:20,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +17: [2023-05-13 03:28:20,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt... +22: [2023-05-13 03:28:20,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:20,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:20,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:20,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:20,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:20,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:20,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:20,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:20,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:20,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:20,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:20,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:20,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:20,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:20,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:20,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +29: [2023-05-13 03:28:20,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:20,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:21,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:21,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:21,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:21,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:21,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:21,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:21,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:21,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:21,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:21,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:21,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:21,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:21,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:21,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:21,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:21,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:21,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:21,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:21,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:21,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:21,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:21,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:21,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:21,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:21,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +27: [2023-05-13 03:28:21,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:21,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:21,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:21,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:21,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +31: [2023-05-13 03:28:21,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +28: [2023-05-13 03:28:21,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +14: [2023-05-13 03:28:21,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +19: [2023-05-13 03:28:21,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +25: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:21,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +12: [2023-05-13 03:28:21,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:21,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_03-model_00-model_states.pt. +17: [2023-05-13 03:28:21,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +21: [2023-05-13 03:28:21,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:21,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:21,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:21,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:21,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:21,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:21,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +23: [2023-05-13 03:28:21,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +10: [2023-05-13 03:28:21,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +23: [2023-05-13 03:28:21,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +10: [2023-05-13 03:28:21,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +11: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +15: [2023-05-13 03:28:21,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +24: [2023-05-13 03:28:21,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +24: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +18: [2023-05-13 03:28:21,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +11: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +28: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +18: [2023-05-13 03:28:21,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +20: [2023-05-13 03:28:21,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:21,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +15: [2023-05-13 03:28:21,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:21,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:21,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +20: [2023-05-13 03:28:21,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +26: [2023-05-13 03:28:21,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:21,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +30: [2023-05-13 03:28:21,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +30: [2023-05-13 03:28:21,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +16: [2023-05-13 03:28:21,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +14: [2023-05-13 03:28:21,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +16: [2023-05-13 03:28:21,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +26: [2023-05-13 03:28:21,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +14: [2023-05-13 03:28:21,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:21,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +28: [2023-05-13 03:28:21,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +12: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +19: [2023-05-13 03:28:21,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:21,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +22: [2023-05-13 03:28:21,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +22: [2023-05-13 03:28:21,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:21,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +17: [2023-05-13 03:28:21,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +17: [2023-05-13 03:28:21,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +13: [2023-05-13 03:28:21,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +13: [2023-05-13 03:28:21,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:21,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +29: [2023-05-13 03:28:21,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +31: [2023-05-13 03:28:21,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +27: [2023-05-13 03:28:21,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt... +25: [2023-05-13 03:28:21,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +25: [2023-05-13 03:28:21,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +31: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +29: [2023-05-13 03:28:21,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +12: [2023-05-13 03:28:21,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +19: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +27: [2023-05-13 03:28:21,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_04-model_00-model_states.pt. +21: [2023-05-13 03:28:21,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:21,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +15: [2023-05-13 03:28:21,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +21: [2023-05-13 03:28:21,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +21: [2023-05-13 03:28:21,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:21,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:21,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +24: [2023-05-13 03:28:21,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:21,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:21,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +10: [2023-05-13 03:28:21,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:21,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:21,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:21,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +10: [2023-05-13 03:28:21,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 9: [2023-05-13 03:28:21,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +11: [2023-05-13 03:28:21,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +11: [2023-05-13 03:28:21,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +24: [2023-05-13 03:28:21,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +30: [2023-05-13 03:28:21,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +30: [2023-05-13 03:28:21,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:21,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:21,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:21,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:21,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:21,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:21,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:21,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:21,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:21,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +15: [2023-05-13 03:28:21,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:21,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:21,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:21,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:21,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +18: [2023-05-13 03:28:21,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +18: [2023-05-13 03:28:21,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:21,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 4: [2023-05-13 03:28:21,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 4: [2023-05-13 03:28:21,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:21,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:21,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +14: [2023-05-13 03:28:21,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +25: [2023-05-13 03:28:21,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +23: [2023-05-13 03:28:21,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:21,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +26: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +16: [2023-05-13 03:28:21,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +28: [2023-05-13 03:28:21,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:21,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +13: [2023-05-13 03:28:21,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:21,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:21,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:21,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +28: [2023-05-13 03:28:21,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:21,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:21,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +13: [2023-05-13 03:28:21,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:21,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:21,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +14: [2023-05-13 03:28:21,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:21,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +26: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:21,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +16: [2023-05-13 03:28:21,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 5: [2023-05-13 03:28:21,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:21,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:21,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:21,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:21,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:21,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:21,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:21,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:21,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:21,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:21,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:21,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:21,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:21,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 7: [2023-05-13 03:28:21,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:21,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:21,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:21,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:21,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:21,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:21,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:21,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 8: [2023-05-13 03:28:21,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:21,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:21,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:21,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:21,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:21,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:21,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +22: [2023-05-13 03:28:21,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:21,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +17: [2023-05-13 03:28:21,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +20: [2023-05-13 03:28:21,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +23: [2023-05-13 03:28:21,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:21,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +17: [2023-05-13 03:28:21,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:21,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:21,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:21,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:21,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:21,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:21,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:21,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:21,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:21,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +29: [2023-05-13 03:28:21,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 6: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:21,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +22: [2023-05-13 03:28:21,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:21,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:21,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:21,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +12: [2023-05-13 03:28:21,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:21,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:21,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:21,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:21,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:21,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:21,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:21,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +19: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:21,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +25: [2023-05-13 03:28:22,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:22,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +27: [2023-05-13 03:28:22,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +20: [2023-05-13 03:28:22,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt... +31: [2023-05-13 03:28:22,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +12: [2023-05-13 03:28:22,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:22,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +19: [2023-05-13 03:28:22,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:22,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:22,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:22,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:22,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:22,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +29: [2023-05-13 03:28:22,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:22,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:22,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +31: [2023-05-13 03:28:22,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:22,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:22,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:22,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. +27: [2023-05-13 03:28:22,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_05-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:22,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:22,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +24: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:22,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:22,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:22,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:22,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:22,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:22,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:22,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:22,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +26: [2023-05-13 03:28:22,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +14: [2023-05-13 03:28:22,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +24: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:22,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +16: [2023-05-13 03:28:22,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +21: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +10: [2023-05-13 03:28:22,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +11: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +10: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:22,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +11: [2023-05-13 03:28:22,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:22,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:22,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:22,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:22,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +15: [2023-05-13 03:28:22,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +18: [2023-05-13 03:28:22,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +18: [2023-05-13 03:28:22,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:22,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +30: [2023-05-13 03:28:22,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +16: [2023-05-13 03:28:22,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +30: [2023-05-13 03:28:22,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +22: [2023-05-13 03:28:22,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +26: [2023-05-13 03:28:22,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +14: [2023-05-13 03:28:22,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +21: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +17: [2023-05-13 03:28:22,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +23: [2023-05-13 03:28:22,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +22: [2023-05-13 03:28:22,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +15: [2023-05-13 03:28:22,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:22,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:22,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +17: [2023-05-13 03:28:22,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:22,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:22,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +28: [2023-05-13 03:28:22,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +27: [2023-05-13 03:28:22,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +13: [2023-05-13 03:28:22,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +19: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +13: [2023-05-13 03:28:22,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +12: [2023-05-13 03:28:22,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +19: [2023-05-13 03:28:22,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +12: [2023-05-13 03:28:22,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +31: [2023-05-13 03:28:22,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +31: [2023-05-13 03:28:22,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +28: [2023-05-13 03:28:22,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +20: [2023-05-13 03:28:22,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +25: [2023-05-13 03:28:22,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +23: [2023-05-13 03:28:22,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +25: [2023-05-13 03:28:22,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +29: [2023-05-13 03:28:22,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt... +20: [2023-05-13 03:28:22,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:22,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:22,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +27: [2023-05-13 03:28:22,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. +29: [2023-05-13 03:28:22,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_06-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:22,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:22,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:22,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:22,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 4: [2023-05-13 03:28:22,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +26: [2023-05-13 03:28:22,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +26: [2023-05-13 03:28:22,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +24: [2023-05-13 03:28:22,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:22,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:22,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +30: [2023-05-13 03:28:22,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:22,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:22,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +21: [2023-05-13 03:28:22,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:22,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +30: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:22,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +25: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:22,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +17: [2023-05-13 03:28:22,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:22,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +19: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +13: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:22,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:22,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +21: [2023-05-13 03:28:22,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:22,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:22,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:22,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:22,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +24: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +24: [2023-05-13 03:28:22,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:22,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +11: [2023-05-13 03:28:22,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +27: [2023-05-13 03:28:22,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:22,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:22,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 9: [2023-05-13 03:28:22,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:22,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 6: [2023-05-13 03:28:22,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +15: [2023-05-13 03:28:22,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:22,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:22,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:22,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:22,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:22,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +15: [2023-05-13 03:28:22,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:22,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:22,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:22,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:22,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:22,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 0: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:22,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:22,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +12: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:22,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:22,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:22,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:22,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:22,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +12: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +20: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +31: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:22,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:22,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:22,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:22,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:22,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:22,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:22,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +31: [2023-05-13 03:28:22,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:22,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +25: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:22,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:23,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +10: [2023-05-13 03:28:23,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +28: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +28: [2023-05-13 03:28:23,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +14: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:23,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:23,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:23,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +22: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +18: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +16: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:23,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +29: [2023-05-13 03:28:23,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +16: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... +23: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +23: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:23,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:23,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:23,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:23,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +22: [2023-05-13 03:28:23,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:23,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:23,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:23,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:23,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:23,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:23,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:23,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:23,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +14: [2023-05-13 03:28:23,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:23,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +27: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +18: [2023-05-13 03:28:23,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +19: [2023-05-13 03:28:23,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +13: [2023-05-13 03:28:23,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:23,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:23,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +17: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:23,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +10: [2023-05-13 03:28:23,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +11: [2023-05-13 03:28:23,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:23,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +20: [2023-05-13 03:28:23,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. +29: [2023-05-13 03:28:23,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_07-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:23,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +15: [2023-05-13 03:28:23,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:23,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:23,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:23,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +30: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:23,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:23,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +26: [2023-05-13 03:28:23,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:23,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:23,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:23,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:23,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:23,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +15: [2023-05-13 03:28:23,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:23,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:23,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:23,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +14: [2023-05-13 03:28:23,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:23,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +26: [2023-05-13 03:28:23,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:23,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +30: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:23,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +14: [2023-05-13 03:28:23,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:23,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:23,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:23,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:23,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:23,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +31: [2023-05-13 03:28:23,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:23,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:23,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +31: [2023-05-13 03:28:23,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:23,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +21: [2023-05-13 03:28:23,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:23,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +18: [2023-05-13 03:28:23,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 0: [2023-05-13 03:28:23,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 0: [2023-05-13 03:28:23,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +18: [2023-05-13 03:28:23,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:23,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:23,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:23,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:23,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:23,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +27: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 1: [2023-05-13 03:28:23,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +13: [2023-05-13 03:28:23,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +29: [2023-05-13 03:28:23,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +22: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +12: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +20: [2023-05-13 03:28:23,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +23: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +24: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +23: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 4: [2023-05-13 03:28:23,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +21: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +13: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:23,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:23,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +24: [2023-05-13 03:28:23,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +11: [2023-05-13 03:28:23,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 4: [2023-05-13 03:28:23,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +24: [2023-05-13 03:28:23,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +24: [2023-05-13 03:28:23,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +24: [2023-05-13 03:28:23,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +24: [2023-05-13 03:28:23,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +28: [2023-05-13 03:28:23,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +27: [2023-05-13 03:28:23,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +19: [2023-05-13 03:28:23,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:23,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:23,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +17: [2023-05-13 03:28:23,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +19: [2023-05-13 03:28:23,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:23,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:23,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 8: [2023-05-13 03:28:23,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 6: [2023-05-13 03:28:23,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:23,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +11: [2023-05-13 03:28:23,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:23,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +10: [2023-05-13 03:28:23,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 2: [2023-05-13 03:28:23,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 5: [2023-05-13 03:28:23,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +29: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 9: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +22: [2023-05-13 03:28:23,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +20: [2023-05-13 03:28:23,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +12: [2023-05-13 03:28:23,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +25: [2023-05-13 03:28:23,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 7: [2023-05-13 03:28:23,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +16: [2023-05-13 03:28:23,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... +10: [2023-05-13 03:28:23,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:23,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +28: [2023-05-13 03:28:23,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +16: [2023-05-13 03:28:23,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:23,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:23,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:23,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:23,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:23,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:23,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:23,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:23,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:23,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:23,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +24: [2023-05-13 03:28:23,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:23,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:23,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:23,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +25: [2023-05-13 03:28:23,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:23,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:23,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:23,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:23,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. +17: [2023-05-13 03:28:23,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:23,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_08-model_00-model_states.pt. + 3: [2023-05-13 03:28:23,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:23,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +30: [2023-05-13 03:28:24,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:24,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +27: [2023-05-13 03:28:24,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +15: [2023-05-13 03:28:24,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:24,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:24,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +30: [2023-05-13 03:28:24,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:24,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +12: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +24: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +10: [2023-05-13 03:28:24,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +22: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +29: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +31: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:24,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +11: [2023-05-13 03:28:24,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:24,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +14: [2023-05-13 03:28:24,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:24,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:24,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:24,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 2: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:24,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:24,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +28: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +10: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +29: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 5: [2023-05-13 03:28:24,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:24,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 6: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +17: [2023-05-13 03:28:24,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +24: [2023-05-13 03:28:24,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:24,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:24,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:24,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:24,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:24,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:24,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:24,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:24,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +31: [2023-05-13 03:28:24,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:24,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:24,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:24,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:24,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:24,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:24,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:24,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:24,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:24,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:24,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +13: [2023-05-13 03:28:24,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:24,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:24,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:24,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:24,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +27: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:24,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:24,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:24,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:24,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:24,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:24,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:24,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:24,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:24,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:24,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:24,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:24,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:24,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:24,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:24,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:24,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:24,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:24,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:24,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:24,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +11: [2023-05-13 03:28:24,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +11: [2023-05-13 03:28:24,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:24,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:24,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:24,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:24,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:24,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:24,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:24,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:24,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:24,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:24,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:24,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:24,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:24,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:24,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:24,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:24,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:24,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:24,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:24,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:24,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:24,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 0: [2023-05-13 03:28:24,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:24,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:24,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:24,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:24,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:24,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:24,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:24,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:24,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:24,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:24,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +27: [2023-05-13 03:28:24,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:24,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:24,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:24,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:24,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:24,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:24,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:24,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:24,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:24,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +30: [2023-05-13 03:28:24,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:24,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:24,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:24,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:25,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:25,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:25,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:25,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:25,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +28: [2023-05-13 03:28:25,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:25,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:25,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:25,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:25,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:25,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:25,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:25,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:25,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:25,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:25,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:25,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:25,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:25,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:25,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:25,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:25,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:25,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:25,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:25,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:25,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:25,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:25,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:25,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:25,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:25,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +14: [2023-05-13 03:28:25,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +28: [2023-05-13 03:28:25,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:25,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:25,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +18: [2023-05-13 03:28:25,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +26: [2023-05-13 03:28:25,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:25,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:25,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +10: [2023-05-13 03:28:25,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:25,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:25,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:25,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +29: [2023-05-13 03:28:25,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:25,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:25,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:25,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +17: [2023-05-13 03:28:25,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +29: [2023-05-13 03:28:25,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +13: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:25,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:25,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:25,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +21: [2023-05-13 03:28:25,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +19: [2023-05-13 03:28:25,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:25,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +12: [2023-05-13 03:28:25,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +19: [2023-05-13 03:28:25,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +21: [2023-05-13 03:28:25,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:25,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:25,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:25,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:25,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:25,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +11: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:25,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:25,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +23: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +28: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +16: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +25: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +26: [2023-05-13 03:28:25,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +20: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +17: [2023-05-13 03:28:25,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt... +18: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +14: [2023-05-13 03:28:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +10: [2023-05-13 03:28:25,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +23: [2023-05-13 03:28:25,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:25,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:25,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:25,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:25,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:25,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:25,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +15: [2023-05-13 03:28:25,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:25,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:25,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:25,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +18: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:25,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:25,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:25,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +23: [2023-05-13 03:28:25,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:25,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:25,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:25,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:25,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +16: [2023-05-13 03:28:25,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +13: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +25: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +14: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +22: [2023-05-13 03:28:25,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:25,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +26: [2023-05-13 03:28:25,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:25,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_09-model_00-model_states.pt. +20: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:25,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:25,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:25,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +15: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +25: [2023-05-13 03:28:25,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +18: [2023-05-13 03:28:25,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +17: [2023-05-13 03:28:25,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:25,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:25,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +26: [2023-05-13 03:28:25,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:25,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:25,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:25,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +25: [2023-05-13 03:28:25,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:25,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:25,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +25: [2023-05-13 03:28:25,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:25,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:25,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:25,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +30: [2023-05-13 03:28:25,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:25,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:25,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +27: [2023-05-13 03:28:25,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +14: [2023-05-13 03:28:25,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:25,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:25,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:25,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:25,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +27: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:25,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:25,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:25,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:25,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +15: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:25,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:25,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:25,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +19: [2023-05-13 03:28:25,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +13: [2023-05-13 03:28:25,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +13: [2023-05-13 03:28:25,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +24: [2023-05-13 03:28:25,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:25,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:25,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:25,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 7: [2023-05-13 03:28:25,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:25,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +31: [2023-05-13 03:28:25,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +22: [2023-05-13 03:28:25,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:25,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:25,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +22: [2023-05-13 03:28:25,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:25,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:25,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +24: [2023-05-13 03:28:25,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:25,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +31: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 2: [2023-05-13 03:28:25,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:25,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:25,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:25,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:25,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:25,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:25,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:25,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:25,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:25,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:25,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +24: [2023-05-13 03:28:25,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:25,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:25,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:25,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:25,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 9: [2023-05-13 03:28:25,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:25,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:25,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:25,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:25,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +25: [2023-05-13 03:28:25,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +25: [2023-05-13 03:28:25,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:25,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +12: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +25: [2023-05-13 03:28:25,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:25,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +23: [2023-05-13 03:28:25,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:25,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +23: [2023-05-13 03:28:25,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:25,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +20: [2023-05-13 03:28:25,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:25,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:25,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +12: [2023-05-13 03:28:25,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:25,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:25,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:25,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:25,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:25,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +21: [2023-05-13 03:28:25,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt... +16: [2023-05-13 03:28:25,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +10: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:25,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:25,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:25,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +25: [2023-05-13 03:28:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +12: [2023-05-13 03:28:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:25,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:25,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:25,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:25,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:25,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +10: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:25,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +11: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:25,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:25,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:25,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +11: [2023-05-13 03:28:25,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:25,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:25,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:25,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:25,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:25,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +23: [2023-05-13 03:28:25,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:25,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:25,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +16: [2023-05-13 03:28:25,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:25,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:25,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:25,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:25,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:25,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:25,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +18: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:25,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +20: [2023-05-13 03:28:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +21: [2023-05-13 03:28:25,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +21: [2023-05-13 03:28:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:25,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:25,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:25,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:25,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:25,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:25,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:25,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +21: [2023-05-13 03:28:25,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:25,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:25,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +18: [2023-05-13 03:28:25,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_10-model_00-model_states.pt. +19: [2023-05-13 03:28:25,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +14: [2023-05-13 03:28:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:25,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:25,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:25,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +13: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:25,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:25,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:25,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:25,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:25,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:25,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:25,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:25,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:25,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:25,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:25,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:25,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:25,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:25,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +10: [2023-05-13 03:28:25,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:25,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:25,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:25,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:25,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:25,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:25,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:25,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:25,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:25,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:25,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:25,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:25,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:25,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:25,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +11: [2023-05-13 03:28:25,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:25,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:25,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:26,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:26,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:26,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:26,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:26,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:26,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:26,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:26,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:26,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:26,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +18: [2023-05-13 03:28:26,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:26,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:26,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:26,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:26,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:26,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:26,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:26,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:26,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +13: [2023-05-13 03:28:26,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:26,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:26,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:26,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:26,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:26,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +30: [2023-05-13 03:28:26,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:26,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:26,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:26,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:26,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:26,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +30: [2023-05-13 03:28:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +30: [2023-05-13 03:28:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:26,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:26,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:26,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +27: [2023-05-13 03:28:26,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +27: [2023-05-13 03:28:26,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +28: [2023-05-13 03:28:26,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:26,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:26,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:26,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:26,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:26,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:26,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:26,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +31: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:26,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +25: [2023-05-13 03:28:26,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +29: [2023-05-13 03:28:26,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:26,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:26,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +27: [2023-05-13 03:28:26,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:26,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +15: [2023-05-13 03:28:26,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:26,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:26,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +26: [2023-05-13 03:28:26,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:26,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +22: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +17: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:26,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +26: [2023-05-13 03:28:26,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +26: [2023-05-13 03:28:26,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +28: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +28: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +26: [2023-05-13 03:28:26,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +16: [2023-05-13 03:28:26,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +17: [2023-05-13 03:28:26,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:26,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:26,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:26,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:26,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +20: [2023-05-13 03:28:26,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:26,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:26,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +15: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +12: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +12: [2023-05-13 03:28:26,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt... +19: [2023-05-13 03:28:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +17: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +19: [2023-05-13 03:28:26,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:26,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:26,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +25: [2023-05-13 03:28:26,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:26,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:26,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +20: [2023-05-13 03:28:26,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +29: [2023-05-13 03:28:26,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +22: [2023-05-13 03:28:26,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +16: [2023-05-13 03:28:26,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +15: [2023-05-13 03:28:26,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +24: [2023-05-13 03:28:26,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +29: [2023-05-13 03:28:26,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +31: [2023-05-13 03:28:26,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +24: [2023-05-13 03:28:26,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +24: [2023-05-13 03:28:26,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. +31: [2023-05-13 03:28:26,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +24: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +29: [2023-05-13 03:28:26,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:26,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +24: [2023-05-13 03:28:26,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +24: [2023-05-13 03:28:26,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +24: [2023-05-13 03:28:26,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +24: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:26,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +22: [2023-05-13 03:28:26,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +19: [2023-05-13 03:28:26,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +22: [2023-05-13 03:28:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +21: [2023-05-13 03:28:26,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_11-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +12: [2023-05-13 03:28:26,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:26,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +21: [2023-05-13 03:28:26,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +19: [2023-05-13 03:28:26,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +10: [2023-05-13 03:28:26,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:26,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:26,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:26,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +23: [2023-05-13 03:28:26,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +23: [2023-05-13 03:28:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +11: [2023-05-13 03:28:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:26,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +14: [2023-05-13 03:28:26,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +10: [2023-05-13 03:28:26,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +14: [2023-05-13 03:28:26,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +16: [2023-05-13 03:28:26,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +20: [2023-05-13 03:28:26,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +14: [2023-05-13 03:28:26,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... +25: [2023-05-13 03:28:26,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:26,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +30: [2023-05-13 03:28:26,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +18: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +16: [2023-05-13 03:28:26,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +17: [2023-05-13 03:28:26,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +17: [2023-05-13 03:28:26,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +31: [2023-05-13 03:28:26,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +20: [2023-05-13 03:28:26,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +13: [2023-05-13 03:28:26,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +28: [2023-05-13 03:28:26,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +25: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_12-model_00-model_states.pt. +15: [2023-05-13 03:28:26,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +19: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +30: [2023-05-13 03:28:26,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:26,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +24: [2023-05-13 03:28:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +18: [2023-05-13 03:28:26,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +15: [2023-05-13 03:28:26,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +18: [2023-05-13 03:28:26,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +30: [2023-05-13 03:28:26,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +31: [2023-05-13 03:28:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +29: [2023-05-13 03:28:26,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +15: [2023-05-13 03:28:26,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +27: [2023-05-13 03:28:26,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +31: [2023-05-13 03:28:26,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +27: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +17: [2023-05-13 03:28:26,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +22: [2023-05-13 03:28:26,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:26,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +21: [2023-05-13 03:28:26,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:26,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +26: [2023-05-13 03:28:26,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +22: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:26,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:26,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:26,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +26: [2023-05-13 03:28:26,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +19: [2023-05-13 03:28:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +29: [2023-05-13 03:28:26,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:26,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:26,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +24: [2023-05-13 03:28:26,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:26,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:26,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:26,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:26,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 1: [2023-05-13 03:28:26,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +12: [2023-05-13 03:28:26,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:26,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:26,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +12: [2023-05-13 03:28:26,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:26,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:26,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:26,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:26,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:26,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +16: [2023-05-13 03:28:26,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +23: [2023-05-13 03:28:26,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:26,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:26,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:26,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 2: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +20: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... + 2: [2023-05-13 03:28:26,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:26,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:26,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:26,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:26,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +21: [2023-05-13 03:28:26,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:26,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +23: [2023-05-13 03:28:26,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:26,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 6: [2023-05-13 03:28:26,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +23: [2023-05-13 03:28:26,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:26,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +11: [2023-05-13 03:28:26,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 4: [2023-05-13 03:28:26,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:26,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +20: [2023-05-13 03:28:26,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +16: [2023-05-13 03:28:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:26,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:26,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:26,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:26,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:26,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:26,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:26,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:26,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +13: [2023-05-13 03:28:26,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:26,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:26,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:26,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:26,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:26,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +13: [2023-05-13 03:28:26,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +14: [2023-05-13 03:28:26,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:26,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:26,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:26,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +28: [2023-05-13 03:28:26,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +25: [2023-05-13 03:28:26,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt... +11: [2023-05-13 03:28:26,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:26,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:26,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:26,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:26,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:26,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:26,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:26,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:26,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:26,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:26,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:26,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:26,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +28: [2023-05-13 03:28:26,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +25: [2023-05-13 03:28:26,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_13-model_00-model_states.pt. +10: [2023-05-13 03:28:26,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:26,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:26,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:26,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:26,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:26,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:26,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:26,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:26,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:26,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:26,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:26,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +30: [2023-05-13 03:28:26,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +17: [2023-05-13 03:28:26,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:26,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:26,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:26,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:26,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:26,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:26,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:26,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +18: [2023-05-13 03:28:26,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:26,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:26,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:26,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +17: [2023-05-13 03:28:26,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:26,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:26,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +18: [2023-05-13 03:28:26,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:26,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:26,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:26,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:26,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:26,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:26,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:26,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:26,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:26,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:26,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:26,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:26,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:26,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:26,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:26,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:26,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:26,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:26,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:27,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:27,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:27,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:27,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:27,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:27,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:27,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:27,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:27,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:27,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:27,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:27,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +22: [2023-05-13 03:28:27,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +22: [2023-05-13 03:28:27,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:27,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:27,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +13: [2023-05-13 03:28:27,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:27,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +23: [2023-05-13 03:28:27,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +23: [2023-05-13 03:28:27,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:27,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:27,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +19: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +19: [2023-05-13 03:28:27,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:27,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +12: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +27: [2023-05-13 03:28:27,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:27,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +14: [2023-05-13 03:28:27,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +12: [2023-05-13 03:28:27,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:27,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:27,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:27,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:27,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +15: [2023-05-13 03:28:27,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:27,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +26: [2023-05-13 03:28:27,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +14: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:27,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:27,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:27,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:27,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:27,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:27,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:27,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:27,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +16: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +20: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +27: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +21: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:27,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:27,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:27,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +11: [2023-05-13 03:28:27,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:27,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +28: [2023-05-13 03:28:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +11: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:27,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +31: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +10: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +13: [2023-05-13 03:28:27,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +13: [2023-05-13 03:28:27,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:27,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +28: [2023-05-13 03:28:27,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:27,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:27,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +30: [2023-05-13 03:28:27,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +24: [2023-05-13 03:28:27,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +28: [2023-05-13 03:28:27,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:27,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +29: [2023-05-13 03:28:27,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +24: [2023-05-13 03:28:27,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +29: [2023-05-13 03:28:27,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:27,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... +25: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +15: [2023-05-13 03:28:27,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +20: [2023-05-13 03:28:27,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:27,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +26: [2023-05-13 03:28:27,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +16: [2023-05-13 03:28:27,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:27,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +31: [2023-05-13 03:28:27,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +21: [2023-05-13 03:28:27,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +10: [2023-05-13 03:28:27,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:27,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +10: [2023-05-13 03:28:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. +25: [2023-05-13 03:28:27,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_14-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +30: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +18: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +22: [2023-05-13 03:28:27,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +18: [2023-05-13 03:28:27,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +17: [2023-05-13 03:28:27,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +19: [2023-05-13 03:28:27,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +19: [2023-05-13 03:28:27,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +17: [2023-05-13 03:28:27,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +27: [2023-05-13 03:28:27,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +29: [2023-05-13 03:28:27,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +20: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +14: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +14: [2023-05-13 03:28:27,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +27: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +24: [2023-05-13 03:28:27,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +11: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +11: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +29: [2023-05-13 03:28:27,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +31: [2023-05-13 03:28:27,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +28: [2023-05-13 03:28:27,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +12: [2023-05-13 03:28:27,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +12: [2023-05-13 03:28:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +30: [2023-05-13 03:28:27,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +16: [2023-05-13 03:28:27,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +15: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +12: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +12: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +16: [2023-05-13 03:28:27,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +13: [2023-05-13 03:28:27,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +15: [2023-05-13 03:28:27,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +24: [2023-05-13 03:28:27,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +26: [2023-05-13 03:28:27,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +21: [2023-05-13 03:28:27,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +26: [2023-05-13 03:28:27,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +21: [2023-05-13 03:28:27,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:27,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +25: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... +31: [2023-05-13 03:28:27,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +31: [2023-05-13 03:28:27,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:27,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +31: [2023-05-13 03:28:27,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +20: [2023-05-13 03:28:27,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +14: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +14: [2023-05-13 03:28:27,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:27,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:27,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +10: [2023-05-13 03:28:27,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +13: [2023-05-13 03:28:27,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +28: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +28: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +13: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +11: [2023-05-13 03:28:27,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +30: [2023-05-13 03:28:27,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:27,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +23: [2023-05-13 03:28:27,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:27,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:27,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +11: [2023-05-13 03:28:27,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 5: [2023-05-13 03:28:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:27,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:27,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:27,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:27,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +23: [2023-05-13 03:28:27,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:27,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:27,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +10: [2023-05-13 03:28:27,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:27,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +10: [2023-05-13 03:28:27,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:27,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +22: [2023-05-13 03:28:27,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +30: [2023-05-13 03:28:27,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:27,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:27,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_15-model_00-model_states.pt. +25: [2023-05-13 03:28:27,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +23: [2023-05-13 03:28:27,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:27,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:27,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:27,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:27,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:27,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:27,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:27,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:27,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:27,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 0: [2023-05-13 03:28:27,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:27,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:27,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +22: [2023-05-13 03:28:27,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:27,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:27,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:27,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:27,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:27,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +22: [2023-05-13 03:28:27,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:27,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +17: [2023-05-13 03:28:27,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:27,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:27,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:27,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +19: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +18: [2023-05-13 03:28:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +18: [2023-05-13 03:28:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:27,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +17: [2023-05-13 03:28:27,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:27,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:27,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:27,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:27,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:27,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +29: [2023-05-13 03:28:27,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 8: [2023-05-13 03:28:27,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 8: [2023-05-13 03:28:27,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +19: [2023-05-13 03:28:27,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:27,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:27,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 7: [2023-05-13 03:28:27,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 7: [2023-05-13 03:28:27,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:27,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:27,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +16: [2023-05-13 03:28:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +29: [2023-05-13 03:28:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +24: [2023-05-13 03:28:27,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +15: [2023-05-13 03:28:27,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +26: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +27: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +15: [2023-05-13 03:28:27,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 2: [2023-05-13 03:28:27,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +21: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +20: [2023-05-13 03:28:27,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... +25: [2023-05-13 03:28:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 4: [2023-05-13 03:28:27,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 9: [2023-05-13 03:28:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:27,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 1: [2023-05-13 03:28:27,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 3: [2023-05-13 03:28:27,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:27,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:27,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +27: [2023-05-13 03:28:27,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +20: [2023-05-13 03:28:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:27,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:27,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:27,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +24: [2023-05-13 03:28:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +16: [2023-05-13 03:28:27,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:27,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:27,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:27,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:27,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +26: [2023-05-13 03:28:27,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:27,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. + 6: [2023-05-13 03:28:27,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +25: [2023-05-13 03:28:27,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_16-model_00-model_states.pt. +21: [2023-05-13 03:28:27,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:27,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:27,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:28,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +22: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +10: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +23: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:28,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +28: [2023-05-13 03:28:28,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +10: [2023-05-13 03:28:28,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +12: [2023-05-13 03:28:28,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +12: [2023-05-13 03:28:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +23: [2023-05-13 03:28:28,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +30: [2023-05-13 03:28:28,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +13: [2023-05-13 03:28:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +22: [2023-05-13 03:28:28,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +28: [2023-05-13 03:28:28,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +13: [2023-05-13 03:28:28,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +14: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +30: [2023-05-13 03:28:28,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +14: [2023-05-13 03:28:28,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +17: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +17: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:28,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:28,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:28,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:28,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +11: [2023-05-13 03:28:28,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +11: [2023-05-13 03:28:28,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:28,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:28,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:28,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:28,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:28,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:28,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +31: [2023-05-13 03:28:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:28,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:28,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +31: [2023-05-13 03:28:28,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +18: [2023-05-13 03:28:28,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:28,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:28,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +18: [2023-05-13 03:28:28,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +15: [2023-05-13 03:28:28,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:28,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:28,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:28,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:28,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:28,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:28,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +29: [2023-05-13 03:28:28,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +19: [2023-05-13 03:28:28,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +27: [2023-05-13 03:28:28,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +15: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +19: [2023-05-13 03:28:28,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +29: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +20: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +16: [2023-05-13 03:28:28,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:28,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:28,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:28,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:28,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +21: [2023-05-13 03:28:28,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:28,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +26: [2023-05-13 03:28:28,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +24: [2023-05-13 03:28:28,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +24: [2023-05-13 03:28:28,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +27: [2023-05-13 03:28:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +25: [2023-05-13 03:28:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +16: [2023-05-13 03:28:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt... +20: [2023-05-13 03:28:28,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +25: [2023-05-13 03:28:28,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +21: [2023-05-13 03:28:28,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. +26: [2023-05-13 03:28:28,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_17-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:28,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +28: [2023-05-13 03:28:28,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:28,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:28,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +28: [2023-05-13 03:28:28,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:28,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:28,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:28,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:28,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:28,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:28,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:28,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:28,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +15: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +31: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +12: [2023-05-13 03:28:28,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +13: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +29: [2023-05-13 03:28:28,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +14: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +30: [2023-05-13 03:28:28,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +12: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +27: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +14: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +24: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 7: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 7: [2023-05-13 03:28:28,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +20: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +13: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:28,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:28,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 0: [2023-05-13 03:28:28,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +29: [2023-05-13 03:28:28,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:28,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +18: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:28,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:28,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:28,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:28,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:28,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:28,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 8: [2023-05-13 03:28:28,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +23: [2023-05-13 03:28:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +24: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:28,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +10: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +10: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +23: [2023-05-13 03:28:28,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:28,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +30: [2023-05-13 03:28:28,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +18: [2023-05-13 03:28:28,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:28,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +25: [2023-05-13 03:28:28,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +16: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +11: [2023-05-13 03:28:28,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +11: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:28,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:28,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:28,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +22: [2023-05-13 03:28:28,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:28,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:28,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:28,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:28,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:28,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:28,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +22: [2023-05-13 03:28:28,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +17: [2023-05-13 03:28:28,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:28,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:28,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:28,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +25: [2023-05-13 03:28:28,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 4: [2023-05-13 03:28:28,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:28,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 2: [2023-05-13 03:28:28,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:28,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 9: [2023-05-13 03:28:28,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +19: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +21: [2023-05-13 03:28:28,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +19: [2023-05-13 03:28:28,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... +26: [2023-05-13 03:28:28,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 5: [2023-05-13 03:28:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +20: [2023-05-13 03:28:28,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 1: [2023-05-13 03:28:28,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +15: [2023-05-13 03:28:28,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:28,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:28,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:28,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:28,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +31: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:28,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +21: [2023-05-13 03:28:28,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:28,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +27: [2023-05-13 03:28:28,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +17: [2023-05-13 03:28:28,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:28,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:28,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:28,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +16: [2023-05-13 03:28:28,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:28,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:28,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 3: [2023-05-13 03:28:28,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. +26: [2023-05-13 03:28:28,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_18-model_00-model_states.pt. + 6: [2023-05-13 03:28:28,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:28,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:28,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:28,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:29,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:29,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:29,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:29,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +28: [2023-05-13 03:28:29,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +28: [2023-05-13 03:28:29,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:29,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:29,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +14: [2023-05-13 03:28:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +14: [2023-05-13 03:28:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:29,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +19: [2023-05-13 03:28:29,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +13: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:29,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +12: [2023-05-13 03:28:29,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +12: [2023-05-13 03:28:29,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +29: [2023-05-13 03:28:29,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +13: [2023-05-13 03:28:29,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:29,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +31: [2023-05-13 03:28:29,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +20: [2023-05-13 03:28:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +29: [2023-05-13 03:28:29,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +31: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +18: [2023-05-13 03:28:29,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +24: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +19: [2023-05-13 03:28:29,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +18: [2023-05-13 03:28:29,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +24: [2023-05-13 03:28:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:29,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +20: [2023-05-13 03:28:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:29,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:29,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:29,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:29,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:29,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +27: [2023-05-13 03:28:29,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +10: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:29,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +10: [2023-05-13 03:28:29,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +30: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +30: [2023-05-13 03:28:29,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:29,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:29,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +22: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:29,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +17: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +11: [2023-05-13 03:28:29,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +11: [2023-05-13 03:28:29,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:29,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +15: [2023-05-13 03:28:29,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:29,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:29,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +25: [2023-05-13 03:28:29,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:29,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:29,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +21: [2023-05-13 03:28:29,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +16: [2023-05-13 03:28:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +15: [2023-05-13 03:28:29,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:29,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:29,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:29,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +26: [2023-05-13 03:28:29,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt... +23: [2023-05-13 03:28:29,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +16: [2023-05-13 03:28:29,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +23: [2023-05-13 03:28:29,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +22: [2023-05-13 03:28:29,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +21: [2023-05-13 03:28:29,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +25: [2023-05-13 03:28:29,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +27: [2023-05-13 03:28:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +17: [2023-05-13 03:28:29,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_19-model_00-model_states.pt. +26: [2023-05-13 03:28:29,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:29,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +12: [2023-05-13 03:28:29,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:29,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:29,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:29,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:29,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:29,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:29,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:29,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +12: [2023-05-13 03:28:29,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:29,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:29,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:29,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:29,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +13: [2023-05-13 03:28:29,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:29,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:29,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:29,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:29,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 0: [2023-05-13 03:28:29,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +11: [2023-05-13 03:28:29,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +18: [2023-05-13 03:28:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:29,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +13: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:29,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:29,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:29,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +18: [2023-05-13 03:28:29,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +29: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +14: [2023-05-13 03:28:29,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:29,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:29,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +14: [2023-05-13 03:28:29,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:29,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:29,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:29,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +29: [2023-05-13 03:28:29,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:29,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:29,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:29,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +11: [2023-05-13 03:28:29,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +23: [2023-05-13 03:28:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +19: [2023-05-13 03:28:29,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:29,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +19: [2023-05-13 03:28:29,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:29,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +10: [2023-05-13 03:28:29,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +27: [2023-05-13 03:28:29,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:29,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 4: [2023-05-13 03:28:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:29,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:29,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:29,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:29,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +21: [2023-05-13 03:28:29,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:29,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:29,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 7: [2023-05-13 03:28:29,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:29,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:29,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:29,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +10: [2023-05-13 03:28:29,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 5: [2023-05-13 03:28:29,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +24: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +24: [2023-05-13 03:28:29,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:29,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +21: [2023-05-13 03:28:29,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:29,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +31: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +22: [2023-05-13 03:28:29,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +17: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +22: [2023-05-13 03:28:29,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:29,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +15: [2023-05-13 03:28:29,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 8: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +28: [2023-05-13 03:28:29,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +28: [2023-05-13 03:28:29,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:29,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:29,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +26: [2023-05-13 03:28:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +30: [2023-05-13 03:28:29,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +15: [2023-05-13 03:28:29,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +27: [2023-05-13 03:28:29,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:29,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:29,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:29,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:29,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +23: [2023-05-13 03:28:29,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:29,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +20: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +31: [2023-05-13 03:28:29,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +16: [2023-05-13 03:28:29,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt... +25: [2023-05-13 03:28:29,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 6: [2023-05-13 03:28:29,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:29,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 2: [2023-05-13 03:28:29,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +30: [2023-05-13 03:28:29,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:29,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:29,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:29,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +20: [2023-05-13 03:28:29,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 9: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +17: [2023-05-13 03:28:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +25: [2023-05-13 03:28:29,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +26: [2023-05-13 03:28:29,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:29,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 3: [2023-05-13 03:28:29,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. +16: [2023-05-13 03:28:29,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_20-model_00-model_states.pt. + 1: [2023-05-13 03:28:29,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:29,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:29,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:29,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:29,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:29,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:29,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +28: [2023-05-13 03:28:30,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +13: [2023-05-13 03:28:30,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +18: [2023-05-13 03:28:30,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +13: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +18: [2023-05-13 03:28:30,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +22: [2023-05-13 03:28:30,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +22: [2023-05-13 03:28:30,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +28: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +19: [2023-05-13 03:28:30,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:30,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:30,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +25: [2023-05-13 03:28:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +27: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +27: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:30,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +11: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +30: [2023-05-13 03:28:30,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +12: [2023-05-13 03:28:30,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +19: [2023-05-13 03:28:30,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +12: [2023-05-13 03:28:30,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +31: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +31: [2023-05-13 03:28:30,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:30,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:30,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +26: [2023-05-13 03:28:30,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:30,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +23: [2023-05-13 03:28:30,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +17: [2023-05-13 03:28:30,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +20: [2023-05-13 03:28:30,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +21: [2023-05-13 03:28:30,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +26: [2023-05-13 03:28:30,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +14: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +20: [2023-05-13 03:28:30,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +15: [2023-05-13 03:28:30,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +24: [2023-05-13 03:28:30,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +25: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +21: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +24: [2023-05-13 03:28:30,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +14: [2023-05-13 03:28:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +10: [2023-05-13 03:28:30,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +15: [2023-05-13 03:28:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +29: [2023-05-13 03:28:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt... +16: [2023-05-13 03:28:30,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +11: [2023-05-13 03:28:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +30: [2023-05-13 03:28:30,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +29: [2023-05-13 03:28:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +10: [2023-05-13 03:28:30,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +17: [2023-05-13 03:28:30,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +16: [2023-05-13 03:28:30,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. +23: [2023-05-13 03:28:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_21-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:30,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:30,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:30,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +13: [2023-05-13 03:28:30,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +10: [2023-05-13 03:28:30,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:30,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +13: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +13: [2023-05-13 03:28:30,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +13: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +10: [2023-05-13 03:28:30,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 4: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 4: [2023-05-13 03:28:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +29: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:30,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +29: [2023-05-13 03:28:30,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +28: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:30,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +26: [2023-05-13 03:28:30,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +12: [2023-05-13 03:28:30,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +21: [2023-05-13 03:28:30,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:30,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +23: [2023-05-13 03:28:30,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:30,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:30,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:30,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +12: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:30,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +28: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:30,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +27: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +30: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +24: [2023-05-13 03:28:30,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +31: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +30: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +21: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +19: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 0: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +15: [2023-05-13 03:28:30,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 8: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 5: [2023-05-13 03:28:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +18: [2023-05-13 03:28:30,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +14: [2023-05-13 03:28:30,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +16: [2023-05-13 03:28:30,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:30,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +25: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +27: [2023-05-13 03:28:30,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +23: [2023-05-13 03:28:30,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:30,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 5: [2023-05-13 03:28:30,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +11: [2023-05-13 03:28:30,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +16: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +20: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:30,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +17: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +18: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:30,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:30,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... +22: [2023-05-13 03:28:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt... + 0: [2023-05-13 03:28:30,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +26: [2023-05-13 03:28:30,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:30,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 7: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +22: [2023-05-13 03:28:30,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:30,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 1: [2023-05-13 03:28:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:30,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:30,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:30,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:30,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:30,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:30,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +14: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +20: [2023-05-13 03:28:30,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:30,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +24: [2023-05-13 03:28:30,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:30,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:30,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +19: [2023-05-13 03:28:30,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:30,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:30,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:30,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +15: [2023-05-13 03:28:30,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:30,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:30,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:30,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 3: [2023-05-13 03:28:30,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:30,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:30,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 6: [2023-05-13 03:28:30,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:30,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:30,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:30,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:30,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:30,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:30,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:30,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 9: [2023-05-13 03:28:30,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:31,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:31,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:31,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +17: [2023-05-13 03:28:31,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +11: [2023-05-13 03:28:31,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +31: [2023-05-13 03:28:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_22-model_00-model_states.pt. +25: [2023-05-13 03:28:31,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:31,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:31,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +10: [2023-05-13 03:28:31,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +13: [2023-05-13 03:28:31,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +13: [2023-05-13 03:28:31,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +13: [2023-05-13 03:28:31,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +13: [2023-05-13 03:28:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +13: [2023-05-13 03:28:31,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +21: [2023-05-13 03:28:31,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:31,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 4: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:31,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:31,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +27: [2023-05-13 03:28:31,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:31,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:31,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:31,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +27: [2023-05-13 03:28:31,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +16: [2023-05-13 03:28:31,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +28: [2023-05-13 03:28:31,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:31,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:31,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:31,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:31,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:31,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +23: [2023-05-13 03:28:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:31,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +23: [2023-05-13 03:28:31,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:31,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:31,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +20: [2023-05-13 03:28:31,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +28: [2023-05-13 03:28:31,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:31,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +20: [2023-05-13 03:28:31,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:31,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:31,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +16: [2023-05-13 03:28:31,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +18: [2023-05-13 03:28:31,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 3: [2023-05-13 03:28:31,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:31,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:31,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:31,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:31,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:31,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:31,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:31,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:31,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:31,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:31,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +24: [2023-05-13 03:28:31,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:31,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:31,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:31,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:31,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:31,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +14: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +18: [2023-05-13 03:28:31,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:31,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:31,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +25: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 0: [2023-05-13 03:28:31,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:31,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:31,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +26: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +19: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:31,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +31: [2023-05-13 03:28:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +29: [2023-05-13 03:28:31,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +22: [2023-05-13 03:28:31,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:31,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:31,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +22: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +17: [2023-05-13 03:28:31,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +11: [2023-05-13 03:28:31,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +15: [2023-05-13 03:28:31,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:31,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +15: [2023-05-13 03:28:31,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:31,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:31,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:31,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:31,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:31,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 7: [2023-05-13 03:28:31,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +19: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 2: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +24: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +29: [2023-05-13 03:28:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +31: [2023-05-13 03:28:31,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +30: [2023-05-13 03:28:31,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:31,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... +12: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +26: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:31,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +14: [2023-05-13 03:28:31,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:31,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +25: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +30: [2023-05-13 03:28:31,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +12: [2023-05-13 03:28:31,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:31,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +11: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +10: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +17: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:31,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:31,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:31,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:31,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:31,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:31,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:31,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:31,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:31,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +10: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:31,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:31,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:31,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:31,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:31,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:31,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:31,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:31,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:31,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:31,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:31,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:31,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 5: [2023-05-13 03:28:31,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:31,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:31,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:31,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:31,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:31,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:31,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:31,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:31,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:32,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +21: [2023-05-13 03:28:32,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_23-model_00-model_states.pt. +13: [2023-05-13 03:28:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:32,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:32,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:32,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +27: [2023-05-13 03:28:32,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:32,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:32,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:32,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:32,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +16: [2023-05-13 03:28:32,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:32,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +20: [2023-05-13 03:28:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:32,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +28: [2023-05-13 03:28:32,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +16: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +20: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +22: [2023-05-13 03:28:32,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:32,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:32,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:32,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +23: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +23: [2023-05-13 03:28:32,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +22: [2023-05-13 03:28:32,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +15: [2023-05-13 03:28:32,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +15: [2023-05-13 03:28:32,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:32,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:32,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +11: [2023-05-13 03:28:32,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:32,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:32,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +14: [2023-05-13 03:28:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +18: [2023-05-13 03:28:32,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +18: [2023-05-13 03:28:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +24: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +26: [2023-05-13 03:28:32,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:32,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +26: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:32,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:32,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:32,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:32,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:32,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:32,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:32,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +17: [2023-05-13 03:28:32,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:32,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +24: [2023-05-13 03:28:32,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +30: [2023-05-13 03:28:32,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:32,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +19: [2023-05-13 03:28:32,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:32,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +12: [2023-05-13 03:28:32,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +14: [2023-05-13 03:28:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +30: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +29: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +13: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +13: [2023-05-13 03:28:32,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +31: [2023-05-13 03:28:32,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +31: [2023-05-13 03:28:32,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +25: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +11: [2023-05-13 03:28:32,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:32,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +17: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +19: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:32,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:32,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +21: [2023-05-13 03:28:32,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt... +25: [2023-05-13 03:28:32,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +12: [2023-05-13 03:28:32,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:32,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +10: [2023-05-13 03:28:32,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:32,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +29: [2023-05-13 03:28:32,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +28: [2023-05-13 03:28:32,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 5: [2023-05-13 03:28:32,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:32,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +21: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:32,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +10: [2023-05-13 03:28:32,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 8: [2023-05-13 03:28:32,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:32,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:32,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +10: [2023-05-13 03:28:32,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +13: [2023-05-13 03:28:32,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +13: [2023-05-13 03:28:32,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +27: [2023-05-13 03:28:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. +21: [2023-05-13 03:28:32,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_24-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:32,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:32,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:32,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:32,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:32,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:32,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:32,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +27: [2023-05-13 03:28:32,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +21: [2023-05-13 03:28:32,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:32,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:32,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:32,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +27: [2023-05-13 03:28:32,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:32,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +28: [2023-05-13 03:28:32,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +28: [2023-05-13 03:28:32,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:32,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +20: [2023-05-13 03:28:32,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:32,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:32,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:32,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:32,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:32,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +16: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 4: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +20: [2023-05-13 03:28:32,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +16: [2023-05-13 03:28:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:32,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:32,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:32,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:32,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +14: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +19: [2023-05-13 03:28:32,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +26: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +23: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +11: [2023-05-13 03:28:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +25: [2023-05-13 03:28:32,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +22: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +12: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +24: [2023-05-13 03:28:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +18: [2023-05-13 03:28:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +31: [2023-05-13 03:28:32,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +17: [2023-05-13 03:28:32,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +15: [2023-05-13 03:28:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +30: [2023-05-13 03:28:32,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:32,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... +29: [2023-05-13 03:28:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +30: [2023-05-13 03:28:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:32,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +18: [2023-05-13 03:28:32,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +22: [2023-05-13 03:28:32,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:32,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:32,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:32,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:32,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:32,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:32,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 0: [2023-05-13 03:28:32,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:32,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:32,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:32,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +15: [2023-05-13 03:28:32,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:32,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +26: [2023-05-13 03:28:32,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:32,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +14: [2023-05-13 03:28:32,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +11: [2023-05-13 03:28:32,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +12: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:32,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:32,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 7: [2023-05-13 03:28:32,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 2: [2023-05-13 03:28:32,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:32,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:32,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +31: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 1: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:32,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:32,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:32,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:32,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:32,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +19: [2023-05-13 03:28:32,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:32,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:32,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +17: [2023-05-13 03:28:32,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 3: [2023-05-13 03:28:32,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:32,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +24: [2023-05-13 03:28:32,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:32,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:32,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +29: [2023-05-13 03:28:32,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +23: [2023-05-13 03:28:32,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:32,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 6: [2023-05-13 03:28:32,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. +25: [2023-05-13 03:28:32,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:32,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:32,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:32,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:32,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:32,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:32,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:32,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:32,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:32,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:32,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_25-model_00-model_states.pt. + 9: [2023-05-13 03:28:32,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:32,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +13: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:33,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:33,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:33,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:33,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:33,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:33,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +19: [2023-05-13 03:28:33,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +14: [2023-05-13 03:28:33,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:33,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +15: [2023-05-13 03:28:33,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:33,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +24: [2023-05-13 03:28:33,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:33,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +27: [2023-05-13 03:28:33,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +31: [2023-05-13 03:28:33,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +31: [2023-05-13 03:28:33,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +31: [2023-05-13 03:28:33,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +31: [2023-05-13 03:28:33,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +14: [2023-05-13 03:28:33,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:33,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:33,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:33,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:33,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:33,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:33,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:33,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:33,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:33,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:33,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:33,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:33,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:33,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:33,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +20: [2023-05-13 03:28:33,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +11: [2023-05-13 03:28:33,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +22: [2023-05-13 03:28:33,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +21: [2023-05-13 03:28:33,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:33,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +10: [2023-05-13 03:28:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +30: [2023-05-13 03:28:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:33,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:33,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:33,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +20: [2023-05-13 03:28:33,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +21: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +17: [2023-05-13 03:28:33,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:33,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +10: [2023-05-13 03:28:33,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:33,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:33,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:33,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:33,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:33,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:33,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:33,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:33,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +27: [2023-05-13 03:28:33,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +10: [2023-05-13 03:28:33,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +30: [2023-05-13 03:28:33,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:33,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:33,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:33,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:33,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:33,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:33,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:33,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:33,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +15: [2023-05-13 03:28:33,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:33,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +16: [2023-05-13 03:28:33,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:33,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:33,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:33,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:33,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +25: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +13: [2023-05-13 03:28:33,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:33,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:33,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:33,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:33,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:33,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:33,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +12: [2023-05-13 03:28:33,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:33,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +15: [2023-05-13 03:28:33,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +13: [2023-05-13 03:28:33,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:33,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:33,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:33,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:33,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:33,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:33,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:33,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:33,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +24: [2023-05-13 03:28:33,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:33,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:33,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +24: [2023-05-13 03:28:33,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:33,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:33,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:33,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +31: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +31: [2023-05-13 03:28:33,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +27: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:33,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:33,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 4: [2023-05-13 03:28:33,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:33,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +25: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +11: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +23: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +11: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 7: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +29: [2023-05-13 03:28:33,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +16: [2023-05-13 03:28:33,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +16: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:33,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:33,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +23: [2023-05-13 03:28:33,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:33,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +12: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +16: [2023-05-13 03:28:33,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:33,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +23: [2023-05-13 03:28:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:33,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +19: [2023-05-13 03:28:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +27: [2023-05-13 03:28:33,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:33,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:33,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:33,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:33,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:33,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +19: [2023-05-13 03:28:33,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:33,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:33,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:33,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:33,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 8: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:33,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:33,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:33,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:33,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:33,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:33,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:33,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:33,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:33,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:33,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:33,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +26: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:33,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:33,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 6: [2023-05-13 03:28:33,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:33,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +29: [2023-05-13 03:28:33,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:33,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +28: [2023-05-13 03:28:33,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:33,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +17: [2023-05-13 03:28:33,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:33,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt... +18: [2023-05-13 03:28:33,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:33,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:33,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +18: [2023-05-13 03:28:33,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:33,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:33,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:33,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:33,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:33,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:33,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:33,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:33,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:33,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:33,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 1: [2023-05-13 03:28:33,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:33,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:33,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:33,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 3: [2023-05-13 03:28:33,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +14: [2023-05-13 03:28:33,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:33,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:33,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +18: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +18: [2023-05-13 03:28:33,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:33,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:33,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:33,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +22: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +14: [2023-05-13 03:28:33,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:33,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. + 9: [2023-05-13 03:28:33,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +22: [2023-05-13 03:28:33,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:33,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +31: [2023-05-13 03:28:33,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:33,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:33,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:33,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +22: [2023-05-13 03:28:33,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:33,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:33,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:33,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:33,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +29: [2023-05-13 03:28:33,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:33,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:33,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +29: [2023-05-13 03:28:33,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:33,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:33,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:33,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:34,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:34,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:34,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +26: [2023-05-13 03:28:34,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_26-model_00-model_states.pt. +28: [2023-05-13 03:28:34,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:34,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:34,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:34,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:34,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:34,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:34,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:34,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:34,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:34,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:34,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:34,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:34,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:34,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:34,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:34,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:34,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:34,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +28: [2023-05-13 03:28:34,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:34,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:34,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +17: [2023-05-13 03:28:34,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:34,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:34,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:34,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:34,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +20: [2023-05-13 03:28:34,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:34,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +28: [2023-05-13 03:28:34,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:34,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:34,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:34,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:34,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +17: [2023-05-13 03:28:34,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:34,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:34,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:34,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:34,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:34,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +12: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:34,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +25: [2023-05-13 03:28:34,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +20: [2023-05-13 03:28:34,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:34,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +12: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +30: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +25: [2023-05-13 03:28:34,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:34,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:34,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:34,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:34,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:34,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +30: [2023-05-13 03:28:34,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +23: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:34,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +21: [2023-05-13 03:28:34,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +10: [2023-05-13 03:28:34,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +21: [2023-05-13 03:28:34,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +10: [2023-05-13 03:28:34,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:34,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:34,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +26: [2023-05-13 03:28:34,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +15: [2023-05-13 03:28:34,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +30: [2023-05-13 03:28:34,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +30: [2023-05-13 03:28:34,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt... +21: [2023-05-13 03:28:34,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +10: [2023-05-13 03:28:34,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +21: [2023-05-13 03:28:34,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +24: [2023-05-13 03:28:34,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +23: [2023-05-13 03:28:34,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +15: [2023-05-13 03:28:34,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +15: [2023-05-13 03:28:34,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +11: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +24: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:34,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:34,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:34,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +24: [2023-05-13 03:28:34,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:34,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +26: [2023-05-13 03:28:34,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +13: [2023-05-13 03:28:34,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:34,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:34,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. +19: [2023-05-13 03:28:34,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +16: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +23: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:34,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +31: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_27-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +16: [2023-05-13 03:28:34,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +22: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +18: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +13: [2023-05-13 03:28:34,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +13: [2023-05-13 03:28:34,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +17: [2023-05-13 03:28:34,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +14: [2023-05-13 03:28:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +19: [2023-05-13 03:28:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +18: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +14: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +19: [2023-05-13 03:28:34,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +22: [2023-05-13 03:28:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +27: [2023-05-13 03:28:34,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +11: [2023-05-13 03:28:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +29: [2023-05-13 03:28:34,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +11: [2023-05-13 03:28:34,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +29: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +31: [2023-05-13 03:28:34,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +12: [2023-05-13 03:28:34,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +27: [2023-05-13 03:28:34,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +28: [2023-05-13 03:28:34,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +17: [2023-05-13 03:28:34,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +28: [2023-05-13 03:28:34,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +12: [2023-05-13 03:28:34,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 4: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:34,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +25: [2023-05-13 03:28:34,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +20: [2023-05-13 03:28:34,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +26: [2023-05-13 03:28:34,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt... +25: [2023-05-13 03:28:34,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +20: [2023-05-13 03:28:34,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_28-model_00-model_states.pt. +26: [2023-05-13 03:28:34,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:34,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:34,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +10: [2023-05-13 03:28:34,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +10: [2023-05-13 03:28:34,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:34,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:34,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:34,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +24: [2023-05-13 03:28:34,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:34,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +30: [2023-05-13 03:28:34,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:34,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:34,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +11: [2023-05-13 03:28:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +30: [2023-05-13 03:28:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:34,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 5: [2023-05-13 03:28:34,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:34,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:34,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:34,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:34,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:34,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:34,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +24: [2023-05-13 03:28:34,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:34,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:34,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:34,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:34,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:34,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:34,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:34,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:34,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:34,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +11: [2023-05-13 03:28:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:34,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:34,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +27: [2023-05-13 03:28:34,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +13: [2023-05-13 03:28:34,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:34,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +19: [2023-05-13 03:28:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +19: [2023-05-13 03:28:34,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:34,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:34,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +13: [2023-05-13 03:28:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:34,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:34,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:34,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:34,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:34,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:34,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:34,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +27: [2023-05-13 03:28:34,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +15: [2023-05-13 03:28:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +15: [2023-05-13 03:28:34,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:34,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:34,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:34,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:34,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:34,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 2: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +18: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:34,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 8: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:34,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +28: [2023-05-13 03:28:34,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:34,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:34,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:34,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +29: [2023-05-13 03:28:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 3: [2023-05-13 03:28:34,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +31: [2023-05-13 03:28:34,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:34,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +20: [2023-05-13 03:28:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +26: [2023-05-13 03:28:34,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +12: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +18: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +23: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:34,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:34,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:34,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:34,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:34,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 6: [2023-05-13 03:28:34,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:34,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +29: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:34,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:34,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:34,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:34,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:34,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 2: [2023-05-13 03:28:34,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:34,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +17: [2023-05-13 03:28:34,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +14: [2023-05-13 03:28:34,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:34,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +22: [2023-05-13 03:28:34,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:34,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:34,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +22: [2023-05-13 03:28:34,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:35,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:35,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:35,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +14: [2023-05-13 03:28:35,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:35,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:35,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +31: [2023-05-13 03:28:35,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +21: [2023-05-13 03:28:35,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:35,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:35,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:35,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:35,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:35,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +25: [2023-05-13 03:28:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:35,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +16: [2023-05-13 03:28:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt... +21: [2023-05-13 03:28:35,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:35,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:35,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:35,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:35,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:35,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +16: [2023-05-13 03:28:35,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:35,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +25: [2023-05-13 03:28:35,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +26: [2023-05-13 03:28:35,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +23: [2023-05-13 03:28:35,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:35,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:35,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:35,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +12: [2023-05-13 03:28:35,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +20: [2023-05-13 03:28:35,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +28: [2023-05-13 03:28:35,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_29-model_00-model_states.pt. +17: [2023-05-13 03:28:35,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +11: [2023-05-13 03:28:35,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:35,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:35,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:35,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:35,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:35,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:35,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +10: [2023-05-13 03:28:35,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +10: [2023-05-13 03:28:35,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +27: [2023-05-13 03:28:35,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +13: [2023-05-13 03:28:35,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +11: [2023-05-13 03:28:35,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +13: [2023-05-13 03:28:35,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:35,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:35,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:35,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:35,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:35,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:35,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +30: [2023-05-13 03:28:35,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:35,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +30: [2023-05-13 03:28:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +24: [2023-05-13 03:28:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +22: [2023-05-13 03:28:35,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +28: [2023-05-13 03:28:35,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:35,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:35,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:35,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +18: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +29: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +12: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +17: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +26: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +25: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +31: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +14: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +18: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +16: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +19: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +15: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +21: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +23: [2023-05-13 03:28:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +20: [2023-05-13 03:28:35,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 6: [2023-05-13 03:28:35,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:35,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:35,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:35,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +29: [2023-05-13 03:28:35,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +31: [2023-05-13 03:28:35,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:35,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:35,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:35,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:35,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:35,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:35,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:35,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:35,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +15: [2023-05-13 03:28:35,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 9: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +14: [2023-05-13 03:28:35,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +26: [2023-05-13 03:28:35,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:35,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:35,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:35,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +19: [2023-05-13 03:28:35,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +24: [2023-05-13 03:28:35,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +16: [2023-05-13 03:28:35,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 0: [2023-05-13 03:28:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +21: [2023-05-13 03:28:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 2: [2023-05-13 03:28:35,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 1: [2023-05-13 03:28:35,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +17: [2023-05-13 03:28:35,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 3: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +12: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +23: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +20: [2023-05-13 03:28:35,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +22: [2023-05-13 03:28:35,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +28: [2023-05-13 03:28:35,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:35,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:35,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 8: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. +25: [2023-05-13 03:28:35,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:35,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:35,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:35,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:35,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 5: [2023-05-13 03:28:35,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:35,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:35,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:35,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:35,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:35,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:35,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:35,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:35,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:35,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:35,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:35,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt... +27: [2023-05-13 03:28:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_30-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:35,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:35,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:35,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +27: [2023-05-13 03:28:35,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:35,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:35,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:35,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +27: [2023-05-13 03:28:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:35,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:35,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:35,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:35,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:35,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:35,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:35,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +30: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:35,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:35,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +13: [2023-05-13 03:28:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:35,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +13: [2023-05-13 03:28:35,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:35,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:35,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:35,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +10: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:35,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:35,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +30: [2023-05-13 03:28:35,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:35,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:35,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:35,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:35,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:35,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:35,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +10: [2023-05-13 03:28:36,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:36,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:36,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:36,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:36,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:36,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:36,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:36,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:36,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:36,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:36,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:36,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:36,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:36,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:36,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:36,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +28: [2023-05-13 03:28:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:36,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:36,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +15: [2023-05-13 03:28:36,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:36,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +11: [2023-05-13 03:28:36,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:36,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +11: [2023-05-13 03:28:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +12: [2023-05-13 03:28:36,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +15: [2023-05-13 03:28:36,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:36,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +28: [2023-05-13 03:28:36,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:36,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:36,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:36,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:36,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:36,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +12: [2023-05-13 03:28:36,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:36,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:36,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:36,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:36,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:36,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:36,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:36,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +29: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +29: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +25: [2023-05-13 03:28:36,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +17: [2023-05-13 03:28:36,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:36,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +18: [2023-05-13 03:28:36,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:36,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +22: [2023-05-13 03:28:36,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:36,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:36,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +22: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +18: [2023-05-13 03:28:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:36,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +17: [2023-05-13 03:28:36,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +26: [2023-05-13 03:28:36,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:36,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:36,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:36,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:36,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 0: [2023-05-13 03:28:36,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +31: [2023-05-13 03:28:36,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:36,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:36,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +31: [2023-05-13 03:28:36,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +14: [2023-05-13 03:28:36,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:36,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:36,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:36,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:36,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:36,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:36,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:36,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +16: [2023-05-13 03:28:36,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:36,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +23: [2023-05-13 03:28:36,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:36,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:36,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:36,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +14: [2023-05-13 03:28:36,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:36,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:36,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +24: [2023-05-13 03:28:36,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +26: [2023-05-13 03:28:36,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:36,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +25: [2023-05-13 03:28:36,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:36,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:36,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:36,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:36,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:36,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:36,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:36,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +19: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +21: [2023-05-13 03:28:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:36,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... +20: [2023-05-13 03:28:36,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +21: [2023-05-13 03:28:36,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:36,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 1: [2023-05-13 03:28:36,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +24: [2023-05-13 03:28:36,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 9: [2023-05-13 03:28:36,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:36,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +16: [2023-05-13 03:28:36,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:36,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:36,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 3: [2023-05-13 03:28:36,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 4: [2023-05-13 03:28:36,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +20: [2023-05-13 03:28:36,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +23: [2023-05-13 03:28:36,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:36,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. +19: [2023-05-13 03:28:36,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_31-model_00-model_states.pt. + 5: [2023-05-13 03:28:36,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:36,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:36,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:36,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:36,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +30: [2023-05-13 03:28:36,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:36,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:36,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:36,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:36,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:36,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:36,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:36,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:36,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +31: [2023-05-13 03:28:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:36,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:36,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +11: [2023-05-13 03:28:36,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:36,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:36,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:36,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +11: [2023-05-13 03:28:36,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:36,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:36,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:36,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:36,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:36,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:36,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:36,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:36,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:36,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:36,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:36,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:36,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:36,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:36,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:36,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:36,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:36,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:36,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:36,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:36,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:36,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:36,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:36,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:36,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:36,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:36,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:36,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:36,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:36,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:36,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:36,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:36,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:36,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:36,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:36,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:36,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:36,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:36,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:36,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:36,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:36,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:36,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:36,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:36,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:36,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:36,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:36,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:36,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:36,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:36,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:36,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:36,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:36,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:36,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:36,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:36,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:37,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +27: [2023-05-13 03:28:37,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +28: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:37,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:37,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:37,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:37,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:37,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:37,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:37,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:37,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:37,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:37,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:37,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:37,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:37,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +16: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:37,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +16: [2023-05-13 03:28:37,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:37,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +16: [2023-05-13 03:28:37,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +16: [2023-05-13 03:28:37,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:37,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +29: [2023-05-13 03:28:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:37,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:37,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:37,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:37,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:37,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:37,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:37,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:37,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:37,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +21: [2023-05-13 03:28:37,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +21: [2023-05-13 03:28:37,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +16: [2023-05-13 03:28:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +16: [2023-05-13 03:28:37,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:37,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +16: [2023-05-13 03:28:37,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:37,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:37,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:37,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:37,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +16: [2023-05-13 03:28:37,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +22: [2023-05-13 03:28:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +14: [2023-05-13 03:28:37,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +22: [2023-05-13 03:28:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +27: [2023-05-13 03:28:37,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:37,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:37,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:37,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:37,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +15: [2023-05-13 03:28:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:37,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:37,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +15: [2023-05-13 03:28:37,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:37,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:37,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:37,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:37,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:37,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:37,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:37,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +19: [2023-05-13 03:28:37,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:37,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +17: [2023-05-13 03:28:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +25: [2023-05-13 03:28:37,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +28: [2023-05-13 03:28:37,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +10: [2023-05-13 03:28:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:37,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:37,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:37,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:37,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +17: [2023-05-13 03:28:37,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:37,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:37,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +11: [2023-05-13 03:28:37,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:37,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +17: [2023-05-13 03:28:37,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +26: [2023-05-13 03:28:37,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +26: [2023-05-13 03:28:37,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +26: [2023-05-13 03:28:37,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +26: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +26: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +26: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:37,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +26: [2023-05-13 03:28:37,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:37,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +26: [2023-05-13 03:28:37,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:37,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:37,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:37,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:37,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +27: [2023-05-13 03:28:37,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 3: [2023-05-13 03:28:37,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:37,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:37,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:37,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:37,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:37,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:37,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +13: [2023-05-13 03:28:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:37,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:37,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:37,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +26: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +31: [2023-05-13 03:28:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +13: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +14: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +29: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:37,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:37,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:37,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:37,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +31: [2023-05-13 03:28:37,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +13: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +12: [2023-05-13 03:28:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +26: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +13: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:37,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +15: [2023-05-13 03:28:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +23: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +13: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +13: [2023-05-13 03:28:37,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +26: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:37,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +21: [2023-05-13 03:28:37,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:37,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:37,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:37,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:37,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +30: [2023-05-13 03:28:37,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:37,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +30: [2023-05-13 03:28:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +27: [2023-05-13 03:28:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +22: [2023-05-13 03:28:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +11: [2023-05-13 03:28:37,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:37,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:37,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:37,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:37,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:37,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +21: [2023-05-13 03:28:37,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:37,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:37,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +21: [2023-05-13 03:28:37,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:37,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:37,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +21: [2023-05-13 03:28:37,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:37,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:37,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:37,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 2: [2023-05-13 03:28:37,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:37,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +29: [2023-05-13 03:28:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:37,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:37,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:37,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:37,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +22: [2023-05-13 03:28:37,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:37,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +27: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +24: [2023-05-13 03:28:37,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +10: [2023-05-13 03:28:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +31: [2023-05-13 03:28:37,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:37,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:37,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +14: [2023-05-13 03:28:37,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:37,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +14: [2023-05-13 03:28:37,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +27: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:37,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +14: [2023-05-13 03:28:37,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:37,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:37,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:37,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:37,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:37,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +12: [2023-05-13 03:28:37,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 6: [2023-05-13 03:28:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:37,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:37,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:37,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:37,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:37,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:37,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:37,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:37,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:37,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:37,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:37,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:37,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +14: [2023-05-13 03:28:37,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:37,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:37,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +22: [2023-05-13 03:28:37,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:37,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:37,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:37,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 5: [2023-05-13 03:28:37,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:37,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:37,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +30: [2023-05-13 03:28:37,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:37,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:37,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:37,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:37,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:37,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +29: [2023-05-13 03:28:37,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:37,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:37,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +12: [2023-05-13 03:28:37,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:37,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:37,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:37,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:37,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:37,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:37,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:37,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:37,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:37,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +30: [2023-05-13 03:28:37,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:37,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:37,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:37,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:37,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:37,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:37,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:37,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:38,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:38,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +10: [2023-05-13 03:28:38,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:38,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:38,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:38,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:38,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:38,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:38,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +10: [2023-05-13 03:28:38,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +28: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:38,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +26: [2023-05-13 03:28:38,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +26: [2023-05-13 03:28:38,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +26: [2023-05-13 03:28:38,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +26: [2023-05-13 03:28:38,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:38,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +17: [2023-05-13 03:28:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +16: [2023-05-13 03:28:38,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +18: [2023-05-13 03:28:38,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +16: [2023-05-13 03:28:38,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +12: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +18: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +12: [2023-05-13 03:28:38,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +12: [2023-05-13 03:28:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +12: [2023-05-13 03:28:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +16: [2023-05-13 03:28:38,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +18: [2023-05-13 03:28:38,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +26: [2023-05-13 03:28:38,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:38,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:38,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:38,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:38,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +18: [2023-05-13 03:28:38,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:38,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:38,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +18: [2023-05-13 03:28:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:38,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:38,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:38,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:38,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:38,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +12: [2023-05-13 03:28:38,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:38,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +25: [2023-05-13 03:28:38,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +25: [2023-05-13 03:28:38,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +25: [2023-05-13 03:28:38,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +24: [2023-05-13 03:28:38,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +25: [2023-05-13 03:28:38,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +20: [2023-05-13 03:28:38,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:38,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +19: [2023-05-13 03:28:38,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +24: [2023-05-13 03:28:38,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +24: [2023-05-13 03:28:38,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +20: [2023-05-13 03:28:38,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:38,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +24: [2023-05-13 03:28:38,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +20: [2023-05-13 03:28:38,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt... +23: [2023-05-13 03:28:38,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +23: [2023-05-13 03:28:38,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +23: [2023-05-13 03:28:38,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +19: [2023-05-13 03:28:38,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:38,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +10: [2023-05-13 03:28:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_32-model_00-model_states.pt. +30: [2023-05-13 03:28:38,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +28: [2023-05-13 03:28:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +28: [2023-05-13 03:28:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +15: [2023-05-13 03:28:38,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:38,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +15: [2023-05-13 03:28:38,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +10: [2023-05-13 03:28:38,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:38,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:38,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +29: [2023-05-13 03:28:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:38,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +16: [2023-05-13 03:28:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:38,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +28: [2023-05-13 03:28:38,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +26: [2023-05-13 03:28:38,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:38,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +13: [2023-05-13 03:28:38,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:38,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +10: [2023-05-13 03:28:38,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +30: [2023-05-13 03:28:38,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +30: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:38,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:38,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +21: [2023-05-13 03:28:38,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:38,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:38,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:38,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +22: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +15: [2023-05-13 03:28:38,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +29: [2023-05-13 03:28:38,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:38,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:38,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:38,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +29: [2023-05-13 03:28:38,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:38,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +16: [2023-05-13 03:28:38,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:38,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 2: [2023-05-13 03:28:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +31: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +16: [2023-05-13 03:28:38,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:38,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:38,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +29: [2023-05-13 03:28:38,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:38,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:38,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:38,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:38,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:38,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +23: [2023-05-13 03:28:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 8: [2023-05-13 03:28:38,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:38,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +12: [2023-05-13 03:28:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +11: [2023-05-13 03:28:38,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +31: [2023-05-13 03:28:38,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 5: [2023-05-13 03:28:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:38,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 5: [2023-05-13 03:28:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +20: [2023-05-13 03:28:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +19: [2023-05-13 03:28:38,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +19: [2023-05-13 03:28:38,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:38,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:38,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +12: [2023-05-13 03:28:38,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +24: [2023-05-13 03:28:38,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:38,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 3: [2023-05-13 03:28:38,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +31: [2023-05-13 03:28:38,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +25: [2023-05-13 03:28:38,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt... +18: [2023-05-13 03:28:38,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 0: [2023-05-13 03:28:38,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:38,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:38,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +31: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +22: [2023-05-13 03:28:38,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:38,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:38,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:38,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +22: [2023-05-13 03:28:38,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:38,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:38,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +23: [2023-05-13 03:28:38,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +18: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +25: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 1: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +24: [2023-05-13 03:28:38,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +11: [2023-05-13 03:28:38,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:38,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +17: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +19: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +19: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +24: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +25: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:38,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +17: [2023-05-13 03:28:38,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +26: [2023-05-13 03:28:38,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +18: [2023-05-13 03:28:38,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +20: [2023-05-13 03:28:38,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 9: [2023-05-13 03:28:38,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_33-model_00-model_states.pt. +23: [2023-05-13 03:28:38,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:38,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +23: [2023-05-13 03:28:38,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:38,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +19: [2023-05-13 03:28:38,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:38,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +17: [2023-05-13 03:28:38,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +11: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +11: [2023-05-13 03:28:38,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +26: [2023-05-13 03:28:38,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +26: [2023-05-13 03:28:38,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +17: [2023-05-13 03:28:38,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:38,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:38,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +12: [2023-05-13 03:28:38,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:38,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +20: [2023-05-13 03:28:38,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt... +12: [2023-05-13 03:28:38,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:38,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +12: [2023-05-13 03:28:38,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:38,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:38,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:38,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:38,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +15: [2023-05-13 03:28:38,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:38,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. +20: [2023-05-13 03:28:38,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_34-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:38,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:38,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +15: [2023-05-13 03:28:38,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:38,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:38,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:38,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:38,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:38,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +10: [2023-05-13 03:28:38,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt... +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt... +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt... +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt... +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt... +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt... +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt... +15: [2023-05-13 03:28:38,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:38,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:38,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:38,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +10: [2023-05-13 03:28:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:38,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:38,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:38,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:38,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:38,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:38,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:38,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:38,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:38,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:38,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:38,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:38,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:38,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:38,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:38,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:39,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +10: [2023-05-13 03:28:38,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:38,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:38,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:39,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:39,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:39,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +14: [2023-05-13 03:28:39,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:39,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:39,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +28: [2023-05-13 03:28:39,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:39,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:39,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:39,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:39,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +13: [2023-05-13 03:28:39,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +14: [2023-05-13 03:28:39,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:39,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +28: [2023-05-13 03:28:39,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +27: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +20: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt... +14: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +14: [2023-05-13 03:28:39,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt... +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt... +27: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt... +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt... +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt... +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt... +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt... +10: [2023-05-13 03:28:39,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +14: [2023-05-13 03:28:39,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +13: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 7: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:39,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:39,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:39,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +13: [2023-05-13 03:28:39,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +13: [2023-05-13 03:28:39,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:39,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +28: [2023-05-13 03:28:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:39,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +30: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:39,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:39,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:39,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:39,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt... +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt... +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt... +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +30: [2023-05-13 03:28:39,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +30: [2023-05-13 03:28:39,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +21: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +21: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt... +14: [2023-05-13 03:28:39,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +21: [2023-05-13 03:28:39,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +21: [2023-05-13 03:28:39,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:39,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +20: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_35-model_00-model_states.pt. +27: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +27: [2023-05-13 03:28:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +27: [2023-05-13 03:28:39,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +27: [2023-05-13 03:28:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt... +27: [2023-05-13 03:28:39,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt... +27: [2023-05-13 03:28:39,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt... +27: [2023-05-13 03:28:39,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt... +27: [2023-05-13 03:28:39,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt... +27: [2023-05-13 03:28:39,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt... +27: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt... + 6: [2023-05-13 03:28:39,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +27: [2023-05-13 03:28:39,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt... +13: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +20: [2023-05-13 03:28:39,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt... +28: [2023-05-13 03:28:39,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt... +11: [2023-05-13 03:28:39,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 1: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:39,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:39,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +29: [2023-05-13 03:28:39,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt... +30: [2023-05-13 03:28:39,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt... +21: [2023-05-13 03:28:39,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt... + 6: [2023-05-13 03:28:39,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:39,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +29: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +22: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +29: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:39,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:39,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:39,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:39,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 9: [2023-05-13 03:28:39,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:39,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:39,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:39,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +25: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +24: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +18: [2023-05-13 03:28:39,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:39,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:39,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:39,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +23: [2023-05-13 03:28:39,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +11: [2023-05-13 03:28:39,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt... + 1: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt... +11: [2023-05-13 03:28:39,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +19: [2023-05-13 03:28:39,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +19: [2023-05-13 03:28:39,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +19: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt... +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt... +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt... +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt... +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt... +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt... +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt... +29: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt... + 0: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt... + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt... + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt... + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt... + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt... + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt... + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt... + 9: [2023-05-13 03:28:39,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt... + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt... + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt... + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt... + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt... + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: > overriding learning rate value to 0.0002 + 0: > overriding minimum learning rate value to 2e-05 + 0: > overriding warmup iterations value to 0 + 0: > overriding total number of iterations value to 1 + 0: > overriding decay style value to cosine +12: [2023-05-13 03:28:39,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +31: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +16: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +16: [2023-05-13 03:28:39,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +16: [2023-05-13 03:28:39,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +22: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +11: [2023-05-13 03:28:39,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +25: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 6: [2023-05-13 03:28:39,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt... + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt... + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt... + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt... + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt... + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt... + 0: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt... +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +26: [2023-05-13 03:28:39,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +26: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 5: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:39,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt. +15: [2023-05-13 03:28:39,317] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 123 + 2: [2023-05-13 03:28:39,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +22: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:39,323] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 123 +22: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 2: [2023-05-13 03:28:39,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt... +19: [2023-05-13 03:28:39,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +31: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +31: [2023-05-13 03:28:39,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +18: [2023-05-13 03:28:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +18: [2023-05-13 03:28:39,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +18: [2023-05-13 03:28:39,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +25: [2023-05-13 03:28:39,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt... +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt... +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt... +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt... +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt... +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +11: [2023-05-13 03:28:39,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +24: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +24: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +23: [2023-05-13 03:28:39,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:39,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt. +15: [2023-05-13 03:28:39,344] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 124 + 3: [2023-05-13 03:28:39,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +23: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 3: [2023-05-13 03:28:39,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 3: [2023-05-13 03:28:39,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +23: [2023-05-13 03:28:39,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:39,350] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 124 + 4: [2023-05-13 03:28:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 8: [2023-05-13 03:28:39,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +12: [2023-05-13 03:28:39,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +17: [2023-05-13 03:28:39,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt... +16: [2023-05-13 03:28:39,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt... + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt... + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt... + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt... + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt... + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt... + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt... + 2: [2023-05-13 03:28:39,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt... +22: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt... +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt... +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt... +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt... +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt... +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt... +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt... +31: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt... +26: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:39,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +12: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +12: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +12: [2023-05-13 03:28:39,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +15: [2023-05-13 03:28:39,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:39,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:39,386] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 125 +20: [2023-05-13 03:28:39,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt... +17: [2023-05-13 03:28:39,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:39,391] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 125 +17: [2023-05-13 03:28:39,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +17: [2023-05-13 03:28:39,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +17: [2023-05-13 03:28:39,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt... +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt... +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt... +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt... +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt... +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt... +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt... +25: [2023-05-13 03:28:39,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt... +23: [2023-05-13 03:28:39,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt... +18: [2023-05-13 03:28:39,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt... + 5: [2023-05-13 03:28:39,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt... + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt... + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt... + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt... + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt... + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt... + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt... + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt... + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt... + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt... + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt... + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt... + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt... + 8: [2023-05-13 03:28:39,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt... +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt... +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt... +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt... +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt... +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt... +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt... +24: [2023-05-13 03:28:39,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt... +17: [2023-05-13 03:28:39,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,431] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 81 +20: [2023-05-13 03:28:39,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,437] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 81 + 4: [2023-05-13 03:28:39,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt. + 4: [2023-05-13 03:28:39,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +10: [2023-05-13 03:28:39,440] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 80 + 4: [2023-05-13 03:28:39,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +10: [2023-05-13 03:28:39,445] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 80 + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt... + 3: [2023-05-13 03:28:39,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt... +12: [2023-05-13 03:28:39,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +15: [2023-05-13 03:28:39,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt. +15: [2023-05-13 03:28:39,458] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 127 +20: [2023-05-13 03:28:39,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +15: [2023-05-13 03:28:39,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt. +15: [2023-05-13 03:28:39,463] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 126 +20: [2023-05-13 03:28:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_36-model_00-model_states.pt. +20: [2023-05-13 03:28:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:39,465] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 127 +20: [2023-05-13 03:28:39,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +15: [2023-05-13 03:28:39,469] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 126 +15: [2023-05-13 03:28:39,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt. +15: [2023-05-13 03:28:39,470] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 120 +15: [2023-05-13 03:28:39,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt. +15: [2023-05-13 03:28:39,472] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 122 +15: [2023-05-13 03:28:39,476] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 120 +15: [2023-05-13 03:28:39,478] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 122 +20: [2023-05-13 03:28:39,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 4: [2023-05-13 03:28:39,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. +20: [2023-05-13 03:28:39,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt... +20: [2023-05-13 03:28:39,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/layer_38-model_00-model_states.pt. + 7: [2023-05-13 03:28:39,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt. + 7: [2023-05-13 03:28:39,514] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 57 +30: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,516] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 241 + 7: [2023-05-13 03:28:39,519] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 57 +30: [2023-05-13 03:28:39,522] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 241 + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt... + 4: [2023-05-13 03:28:39,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt... +10: [2023-05-13 03:28:39,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,531] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 87 +27: [2023-05-13 03:28:39,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:39,533] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 221 +10: [2023-05-13 03:28:39,536] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 87 +27: [2023-05-13 03:28:39,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:39,537] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 220 +27: [2023-05-13 03:28:39,539] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 221 +28: [2023-05-13 03:28:39,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,542] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 224 +27: [2023-05-13 03:28:39,543] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 220 +28: [2023-05-13 03:28:39,548] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 224 +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt... +20: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt... + 7: [2023-05-13 03:28:39,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:39,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt. + 7: [2023-05-13 03:28:39,550] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 58 +27: [2023-05-13 03:28:39,550] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 219 +28: [2023-05-13 03:28:39,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,553] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 227 + 7: [2023-05-13 03:28:39,556] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 58 +27: [2023-05-13 03:28:39,556] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 219 +28: [2023-05-13 03:28:39,558] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 227 +10: [2023-05-13 03:28:39,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,563] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 83 +28: [2023-05-13 03:28:39,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,566] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 231 +10: [2023-05-13 03:28:39,567] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 83 +28: [2023-05-13 03:28:39,570] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 231 +10: [2023-05-13 03:28:39,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,585] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 82 + 9: [2023-05-13 03:28:39,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,587] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 79 +10: [2023-05-13 03:28:39,590] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 82 +13: [2023-05-13 03:28:39,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt. +13: [2023-05-13 03:28:39,591] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 106 + 9: [2023-05-13 03:28:39,593] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 79 +13: [2023-05-13 03:28:39,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt. +13: [2023-05-13 03:28:39,594] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 109 +13: [2023-05-13 03:28:39,597] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 106 +13: [2023-05-13 03:28:39,599] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 109 + 1: [2023-05-13 03:28:39,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt. + 1: [2023-05-13 03:28:39,602] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 14 +14: [2023-05-13 03:28:39,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,604] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 112 +30: [2023-05-13 03:28:39,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,604] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 246 + 1: [2023-05-13 03:28:39,607] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 14 +27: [2023-05-13 03:28:39,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:39,609] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 222 +14: [2023-05-13 03:28:39,609] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 112 +30: [2023-05-13 03:28:39,609] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 246 +27: [2023-05-13 03:28:39,615] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 222 +14: [2023-05-13 03:28:39,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,618] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 119 +29: [2023-05-13 03:28:39,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt. +29: [2023-05-13 03:28:39,624] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 233 +14: [2023-05-13 03:28:39,623] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 119 +29: [2023-05-13 03:28:39,629] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 233 +14: [2023-05-13 03:28:39,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,634] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 116 +21: [2023-05-13 03:28:39,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,637] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 171 +14: [2023-05-13 03:28:39,639] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 116 + 7: [2023-05-13 03:28:39,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,642] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 171 + 7: [2023-05-13 03:28:39,643] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 62 +13: [2023-05-13 03:28:39,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt. +13: [2023-05-13 03:28:39,646] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 108 + 7: [2023-05-13 03:28:39,647] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 62 +21: [2023-05-13 03:28:39,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,648] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 170 +21: [2023-05-13 03:28:39,653] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 170 +13: [2023-05-13 03:28:39,655] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 108 +30: [2023-05-13 03:28:39,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,656] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 240 +28: [2023-05-13 03:28:39,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,660] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 229 +30: [2023-05-13 03:28:39,661] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 240 +14: [2023-05-13 03:28:39,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,664] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 114 +28: [2023-05-13 03:28:39,667] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 229 +14: [2023-05-13 03:28:39,669] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 114 +21: [2023-05-13 03:28:39,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,671] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 173 +21: [2023-05-13 03:28:39,676] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 173 +13: [2023-05-13 03:28:39,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt. +13: [2023-05-13 03:28:39,679] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 110 +27: [2023-05-13 03:28:39,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:39,681] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 216 +13: [2023-05-13 03:28:39,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,684] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 245 +13: [2023-05-13 03:28:39,685] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 107 +13: [2023-05-13 03:28:39,685] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 110 +27: [2023-05-13 03:28:39,687] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 216 +14: [2023-05-13 03:28:39,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,688] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 113 +14: [2023-05-13 03:28:39,688] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 118 +30: [2023-05-13 03:28:39,689] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 245 +13: [2023-05-13 03:28:39,690] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 107 +10: [2023-05-13 03:28:39,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,692] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 84 +14: [2023-05-13 03:28:39,693] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 118 +14: [2023-05-13 03:28:39,693] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 113 +29: [2023-05-13 03:28:39,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt. +29: [2023-05-13 03:28:39,694] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 238 +10: [2023-05-13 03:28:39,698] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 84 +14: [2023-05-13 03:28:39,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,699] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 115 +29: [2023-05-13 03:28:39,700] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 238 +14: [2023-05-13 03:28:39,705] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 115 + 6: [2023-05-13 03:28:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:39,706] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 50 +21: [2023-05-13 03:28:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,708] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 168 + 1: [2023-05-13 03:28:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt. + 1: [2023-05-13 03:28:39,709] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 12 +30: [2023-05-13 03:28:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,710] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 244 +10: [2023-05-13 03:28:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,711] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 86 + 6: [2023-05-13 03:28:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:39,712] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 55 + 7: [2023-05-13 03:28:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,712] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 77 + 6: [2023-05-13 03:28:39,712] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 50 + 7: [2023-05-13 03:28:39,712] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 59 +21: [2023-05-13 03:28:39,713] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 168 +14: [2023-05-13 03:28:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt. +14: [2023-05-13 03:28:39,714] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 117 +30: [2023-05-13 03:28:39,715] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 244 + 1: [2023-05-13 03:28:39,715] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 12 +10: [2023-05-13 03:28:39,716] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 86 + 1: [2023-05-13 03:28:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,717] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 77 + 1: [2023-05-13 03:28:39,718] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 13 + 5: [2023-05-13 03:28:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt. +10: [2023-05-13 03:28:39,719] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 85 + 5: [2023-05-13 03:28:39,719] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 42 + 7: [2023-05-13 03:28:39,719] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 59 + 6: [2023-05-13 03:28:39,719] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 55 +14: [2023-05-13 03:28:39,720] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 117 + 5: [2023-05-13 03:28:39,724] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 42 +10: [2023-05-13 03:28:39,724] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 85 + 1: [2023-05-13 03:28:39,725] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 13 + 7: [2023-05-13 03:28:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt. + 7: [2023-05-13 03:28:39,730] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 61 + 7: [2023-05-13 03:28:39,735] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 61 +30: [2023-05-13 03:28:39,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,736] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 247 + 9: [2023-05-13 03:28:39,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,738] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 78 +21: [2023-05-13 03:28:39,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,740] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 172 +30: [2023-05-13 03:28:39,741] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 247 + 9: [2023-05-13 03:28:39,744] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 78 + 9: [2023-05-13 03:28:39,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,744] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 75 + 9: [2023-05-13 03:28:39,745] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 72 +21: [2023-05-13 03:28:39,745] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 172 + 6: [2023-05-13 03:28:39,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:39,746] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 51 +11: [2023-05-13 03:28:39,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,748] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 88 +13: [2023-05-13 03:28:39,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt. +13: [2023-05-13 03:28:39,750] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 105 + 9: [2023-05-13 03:28:39,750] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 75 + 9: [2023-05-13 03:28:39,750] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 72 +30: [2023-05-13 03:28:39,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,751] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 242 + 6: [2023-05-13 03:28:39,753] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 51 +11: [2023-05-13 03:28:39,753] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 88 +13: [2023-05-13 03:28:39,755] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 105 +30: [2023-05-13 03:28:39,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,755] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 243 +23: [2023-05-13 03:28:39,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt. + 7: [2023-05-13 03:28:39,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,756] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 184 + 7: [2023-05-13 03:28:39,756] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 56 +30: [2023-05-13 03:28:39,757] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 242 +18: [2023-05-13 03:28:39,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt. +18: [2023-05-13 03:28:39,758] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 145 +29: [2023-05-13 03:28:39,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt. +29: [2023-05-13 03:28:39,759] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 237 + 7: [2023-05-13 03:28:39,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt. +30: [2023-05-13 03:28:39,761] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 243 + 7: [2023-05-13 03:28:39,761] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 63 +31: [2023-05-13 03:28:39,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,762] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 184 +31: [2023-05-13 03:28:39,762] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 248 + 7: [2023-05-13 03:28:39,762] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 56 +21: [2023-05-13 03:28:39,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,764] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 174 +18: [2023-05-13 03:28:39,764] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 145 +29: [2023-05-13 03:28:39,765] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 237 + 7: [2023-05-13 03:28:39,766] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 63 +13: [2023-05-13 03:28:39,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt. +13: [2023-05-13 03:28:39,767] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 104 +31: [2023-05-13 03:28:39,768] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 248 +22: [2023-05-13 03:28:39,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:39,768] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 178 +21: [2023-05-13 03:28:39,769] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 174 +11: [2023-05-13 03:28:39,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:39,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,771] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 95 +16: [2023-05-13 03:28:39,771] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 131 +29: [2023-05-13 03:28:39,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,771] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 45 +29: [2023-05-13 03:28:39,771] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 234 +13: [2023-05-13 03:28:39,773] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 104 +22: [2023-05-13 03:28:39,774] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 178 + 5: [2023-05-13 03:28:39,776] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 45 +16: [2023-05-13 03:28:39,777] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 131 +29: [2023-05-13 03:28:39,777] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 234 + 1: [2023-05-13 03:28:39,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,777] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 95 + 1: [2023-05-13 03:28:39,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt. + 1: [2023-05-13 03:28:39,778] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 15 + 1: [2023-05-13 03:28:39,778] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 10 +25: [2023-05-13 03:28:39,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:39,779] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 205 + 1: [2023-05-13 03:28:39,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt. + 1: [2023-05-13 03:28:39,780] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 8 +11: [2023-05-13 03:28:39,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,781] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 91 + 5: [2023-05-13 03:28:39,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt. + 1: [2023-05-13 03:28:39,784] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 15 + 5: [2023-05-13 03:28:39,784] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 46 +25: [2023-05-13 03:28:39,784] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 205 + 1: [2023-05-13 03:28:39,784] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 10 + 1: [2023-05-13 03:28:39,785] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 8 +11: [2023-05-13 03:28:39,786] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 91 + 1: [2023-05-13 03:28:39,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:39,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,789] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 46 + 9: [2023-05-13 03:28:39,789] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 73 + 1: [2023-05-13 03:28:39,789] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 11 + 8: [2023-05-13 03:28:39,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt. + 2: [2023-05-13 03:28:39,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,791] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 255 + 2: [2023-05-13 03:28:39,791] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 20 + 8: [2023-05-13 03:28:39,791] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 67 + 9: [2023-05-13 03:28:39,794] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 73 + 1: [2023-05-13 03:28:39,794] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 11 +31: [2023-05-13 03:28:39,795] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 255 + 8: [2023-05-13 03:28:39,796] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 67 +15: [2023-05-13 03:28:39,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt. + 2: [2023-05-13 03:28:39,797] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 20 +15: [2023-05-13 03:28:39,797] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 121 +15: [2023-05-13 03:28:39,803] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 121 +28: [2023-05-13 03:28:39,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,806] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 226 +28: [2023-05-13 03:28:39,810] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 226 + 6: [2023-05-13 03:28:39,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:39,811] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 49 + 0: [2023-05-13 03:28:39,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,812] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 3 +29: [2023-05-13 03:28:39,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:39,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt. +29: [2023-05-13 03:28:39,813] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 239 +29: [2023-05-13 03:28:39,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt. +29: [2023-05-13 03:28:39,814] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 236 +21: [2023-05-13 03:28:39,814] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 175 + 6: [2023-05-13 03:28:39,817] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 49 +19: [2023-05-13 03:28:39,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt. +19: [2023-05-13 03:28:39,817] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 158 + 0: [2023-05-13 03:28:39,817] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 3 +22: [2023-05-13 03:28:39,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:39,818] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 181 +29: [2023-05-13 03:28:39,819] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 239 +21: [2023-05-13 03:28:39,820] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 175 +29: [2023-05-13 03:28:39,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 236 +19: [2023-05-13 03:28:39,822] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 158 +22: [2023-05-13 03:28:39,823] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 181 +19: [2023-05-13 03:28:39,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt. +19: [2023-05-13 03:28:39,825] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 159 + 5: [2023-05-13 03:28:39,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,826] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 43 +23: [2023-05-13 03:28:39,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,826] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 186 + 0: [2023-05-13 03:28:39,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,827] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 2 +24: [2023-05-13 03:28:39,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt. +24: [2023-05-13 03:28:39,830] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 192 +28: [2023-05-13 03:28:39,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,830] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 225 +19: [2023-05-13 03:28:39,830] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 159 + 5: [2023-05-13 03:28:39,831] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 43 +23: [2023-05-13 03:28:39,831] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 186 + 0: [2023-05-13 03:28:39,833] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 2 +24: [2023-05-13 03:28:39,835] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 192 +23: [2023-05-13 03:28:39,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,835] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 225 +23: [2023-05-13 03:28:39,836] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 189 + 6: [2023-05-13 03:28:39,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:39,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:39,837] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 53 + 0: [2023-05-13 03:28:39,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:39,837] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 54 +19: [2023-05-13 03:28:39,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,837] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 4 +19: [2023-05-13 03:28:39,837] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 157 + 0: [2023-05-13 03:28:39,838] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 7 + 2: [2023-05-13 03:28:39,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt. +13: [2023-05-13 03:28:39,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt. + 2: [2023-05-13 03:28:39,839] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 18 + 0: [2023-05-13 03:28:39,839] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 0 +13: [2023-05-13 03:28:39,839] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 111 +19: [2023-05-13 03:28:39,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt. +19: [2023-05-13 03:28:39,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,841] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 189 +19: [2023-05-13 03:28:39,841] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 156 +19: [2023-05-13 03:28:39,841] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 155 + 6: [2023-05-13 03:28:39,842] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 53 + 6: [2023-05-13 03:28:39,843] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 54 +26: [2023-05-13 03:28:39,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,844] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 4 +26: [2023-05-13 03:28:39,844] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 208 + 0: [2023-05-13 03:28:39,844] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 7 + 2: [2023-05-13 03:28:39,844] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 18 +19: [2023-05-13 03:28:39,845] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 157 + 0: [2023-05-13 03:28:39,845] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 0 +13: [2023-05-13 03:28:39,846] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 111 +19: [2023-05-13 03:28:39,846] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 156 +18: [2023-05-13 03:28:39,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt. +19: [2023-05-13 03:28:39,847] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 155 +18: [2023-05-13 03:28:39,847] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 144 +11: [2023-05-13 03:28:39,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,849] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 94 +26: [2023-05-13 03:28:39,849] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 208 +25: [2023-05-13 03:28:39,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:39,850] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 204 + 0: could not find arguments in the checkpoint ... + 0: checkpoint version 3.0 +18: [2023-05-13 03:28:39,852] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 144 +11: [2023-05-13 03:28:39,853] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 94 +11: [2023-05-13 03:28:39,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,854] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 89 + 0: [2023-05-13 03:28:39,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,855] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 5 +16: [2023-05-13 03:28:39,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:39,856] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 129 + 9: [2023-05-13 03:28:39,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:39,858] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 204 + 9: [2023-05-13 03:28:39,858] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 74 + 7: [2023-05-13 03:28:39,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,859] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 89 + 7: [2023-05-13 03:28:39,860] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 60 + 0: [2023-05-13 03:28:39,860] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 5 + 8: [2023-05-13 03:28:39,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:39,861] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 64 +16: [2023-05-13 03:28:39,861] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 129 +16: [2023-05-13 03:28:39,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:39,864] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 135 + 9: [2023-05-13 03:28:39,864] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 74 + 7: [2023-05-13 03:28:39,866] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 60 +17: [2023-05-13 03:28:39,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:39,866] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 140 + 8: [2023-05-13 03:28:39,866] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 64 +16: [2023-05-13 03:28:39,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:39,867] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 132 +16: [2023-05-13 03:28:39,869] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 135 + 2: [2023-05-13 03:28:39,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:39,872] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 140 + 2: [2023-05-13 03:28:39,872] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 17 +16: [2023-05-13 03:28:39,872] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 132 +31: [2023-05-13 03:28:39,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,874] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 253 +24: [2023-05-13 03:28:39,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:39,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt. + 2: [2023-05-13 03:28:39,877] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 17 +24: [2023-05-13 03:28:39,877] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 196 +25: [2023-05-13 03:28:39,877] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 200 + 3: [2023-05-13 03:28:39,878] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 31 +31: [2023-05-13 03:28:39,879] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 253 +27: [2023-05-13 03:28:39,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:39,879] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 218 +25: [2023-05-13 03:28:39,882] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 200 +24: [2023-05-13 03:28:39,882] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 196 + 3: [2023-05-13 03:28:39,883] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 31 +22: [2023-05-13 03:28:39,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:39,884] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 182 +27: [2023-05-13 03:28:39,885] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 218 +22: [2023-05-13 03:28:39,890] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 182 + 3: [2023-05-13 03:28:39,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,891] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 24 + 2: [2023-05-13 03:28:39,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt. + 2: [2023-05-13 03:28:39,892] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 16 +12: [2023-05-13 03:28:39,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt. +12: [2023-05-13 03:28:39,893] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 100 +25: [2023-05-13 03:28:39,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:39,897] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 207 + 3: [2023-05-13 03:28:39,897] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 24 + 2: [2023-05-13 03:28:39,898] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 16 +12: [2023-05-13 03:28:39,899] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 100 +25: [2023-05-13 03:28:39,903] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 207 +16: [2023-05-13 03:28:39,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:39,906] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 130 +18: [2023-05-13 03:28:39,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt. +18: [2023-05-13 03:28:39,907] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 149 + 0: [2023-05-13 03:28:39,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt. + 0: [2023-05-13 03:28:39,909] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 1 + 8: [2023-05-13 03:28:39,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:39,909] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 69 + 2: [2023-05-13 03:28:39,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:39,911] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 130 + 2: [2023-05-13 03:28:39,911] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 21 +18: [2023-05-13 03:28:39,912] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 149 +12: [2023-05-13 03:28:39,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt. +12: [2023-05-13 03:28:39,912] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 102 + 0: [2023-05-13 03:28:39,914] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 1 + 8: [2023-05-13 03:28:39,915] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 69 + 5: [2023-05-13 03:28:39,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:39,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,916] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 41 + 8: [2023-05-13 03:28:39,916] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 68 +20: [2023-05-13 03:28:39,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt. +20: [2023-05-13 03:28:39,916] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 164 + 2: [2023-05-13 03:28:39,917] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 21 +12: [2023-05-13 03:28:39,917] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 102 +31: [2023-05-13 03:28:39,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,918] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 249 +23: [2023-05-13 03:28:39,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,920] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 187 +11: [2023-05-13 03:28:39,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:39,920] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 68 +11: [2023-05-13 03:28:39,921] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 93 + 5: [2023-05-13 03:28:39,921] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 41 +20: [2023-05-13 03:28:39,922] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 164 +31: [2023-05-13 03:28:39,923] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 249 +26: [2023-05-13 03:28:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:39,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt. +26: [2023-05-13 03:28:39,923] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 211 +17: [2023-05-13 03:28:39,923] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 136 + 2: [2023-05-13 03:28:39,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt. + 2: [2023-05-13 03:28:39,924] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 22 + 0: [2023-05-13 03:28:39,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,925] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 187 +20: [2023-05-13 03:28:39,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt. +20: [2023-05-13 03:28:39,926] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 161 + 0: [2023-05-13 03:28:39,926] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 6 +11: [2023-05-13 03:28:39,926] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 93 +25: [2023-05-13 03:28:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:39,926] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 203 +11: [2023-05-13 03:28:39,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,927] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 90 +26: [2023-05-13 03:28:39,928] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 211 +17: [2023-05-13 03:28:39,928] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 136 + 2: [2023-05-13 03:28:39,929] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 22 +19: [2023-05-13 03:28:39,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt. +19: [2023-05-13 03:28:39,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 154 +20: [2023-05-13 03:28:39,931] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 161 +25: [2023-05-13 03:28:39,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 203 +11: [2023-05-13 03:28:39,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 90 +28: [2023-05-13 03:28:39,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 230 +18: [2023-05-13 03:28:39,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt. +18: [2023-05-13 03:28:39,934] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 147 +24: [2023-05-13 03:28:39,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt. +18: [2023-05-13 03:28:39,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt. +24: [2023-05-13 03:28:39,935] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 195 + 0: [2023-05-13 03:28:39,935] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 6 +18: [2023-05-13 03:28:39,935] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 148 +31: [2023-05-13 03:28:39,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,935] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 251 + 3: [2023-05-13 03:28:39,936] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 29 +19: [2023-05-13 03:28:39,936] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 154 + 5: [2023-05-13 03:28:39,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,937] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 40 +27: [2023-05-13 03:28:39,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt. +19: [2023-05-13 03:28:39,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:39,938] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 217 +28: [2023-05-13 03:28:39,938] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 230 +19: [2023-05-13 03:28:39,938] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 153 +26: [2023-05-13 03:28:39,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt. +26: [2023-05-13 03:28:39,939] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 214 +31: [2023-05-13 03:28:39,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,940] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 252 +24: [2023-05-13 03:28:39,940] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 195 +18: [2023-05-13 03:28:39,940] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 147 +18: [2023-05-13 03:28:39,940] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 148 +31: [2023-05-13 03:28:39,941] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 251 +26: [2023-05-13 03:28:39,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt. +26: [2023-05-13 03:28:39,941] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 213 + 3: [2023-05-13 03:28:39,941] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 29 + 5: [2023-05-13 03:28:39,941] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 40 +27: [2023-05-13 03:28:39,943] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 217 +22: [2023-05-13 03:28:39,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:39,943] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 179 +23: [2023-05-13 03:28:39,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,944] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 190 +26: [2023-05-13 03:28:39,945] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 214 + 3: [2023-05-13 03:28:39,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,945] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 252 + 3: [2023-05-13 03:28:39,945] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 30 +19: [2023-05-13 03:28:39,946] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 153 +12: [2023-05-13 03:28:39,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt. +12: [2023-05-13 03:28:39,946] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 103 +26: [2023-05-13 03:28:39,947] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 213 +22: [2023-05-13 03:28:39,948] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 179 +23: [2023-05-13 03:28:39,950] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 190 +19: [2023-05-13 03:28:39,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt. +19: [2023-05-13 03:28:39,950] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 152 + 3: [2023-05-13 03:28:39,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,952] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 27 + 3: [2023-05-13 03:28:39,953] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 28 +12: [2023-05-13 03:28:39,953] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 103 + 2: [2023-05-13 03:28:39,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,954] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 30 + 2: [2023-05-13 03:28:39,954] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 23 +28: [2023-05-13 03:28:39,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,955] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 228 +19: [2023-05-13 03:28:39,956] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 152 + 5: [2023-05-13 03:28:39,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,956] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 44 + 3: [2023-05-13 03:28:39,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,957] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 26 + 4: [2023-05-13 03:28:39,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt. + 3: [2023-05-13 03:28:39,958] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 27 + 3: [2023-05-13 03:28:39,959] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 28 + 4: [2023-05-13 03:28:39,959] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 32 + 5: [2023-05-13 03:28:39,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt. + 5: [2023-05-13 03:28:39,960] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 47 + 2: [2023-05-13 03:28:39,960] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 23 + 3: [2023-05-13 03:28:39,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt. +28: [2023-05-13 03:28:39,961] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 228 + 3: [2023-05-13 03:28:39,961] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 25 + 5: [2023-05-13 03:28:39,961] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 44 + 3: [2023-05-13 03:28:39,962] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 26 +31: [2023-05-13 03:28:39,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:39,963] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 250 + 4: [2023-05-13 03:28:39,964] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 32 + 5: [2023-05-13 03:28:39,964] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 47 + 3: [2023-05-13 03:28:39,966] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 25 +31: [2023-05-13 03:28:39,968] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 250 +16: [2023-05-13 03:28:39,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:39,973] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 133 + 8: [2023-05-13 03:28:39,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:39,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:39,976] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 66 +17: [2023-05-13 03:28:39,976] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 137 +12: [2023-05-13 03:28:39,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt. +12: [2023-05-13 03:28:39,977] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 99 +16: [2023-05-13 03:28:39,978] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 133 + 8: [2023-05-13 03:28:39,982] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 66 +12: [2023-05-13 03:28:39,982] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 99 +17: [2023-05-13 03:28:39,982] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 137 +26: [2023-05-13 03:28:39,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt. +26: [2023-05-13 03:28:39,983] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 212 +23: [2023-05-13 03:28:39,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:39,983] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 188 +24: [2023-05-13 03:28:39,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:39,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt. +24: [2023-05-13 03:28:39,986] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 199 +22: [2023-05-13 03:28:39,986] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 177 + 8: [2023-05-13 03:28:39,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:39,987] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 65 +17: [2023-05-13 03:28:39,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:39,988] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 143 +23: [2023-05-13 03:28:39,988] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 188 +26: [2023-05-13 03:28:39,989] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 212 +18: [2023-05-13 03:28:39,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt. +18: [2023-05-13 03:28:39,990] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 151 +12: [2023-05-13 03:28:39,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:39,992] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 177 +12: [2023-05-13 03:28:39,992] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 98 +24: [2023-05-13 03:28:39,992] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 199 + 8: [2023-05-13 03:28:39,992] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 65 +11: [2023-05-13 03:28:39,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt. +11: [2023-05-13 03:28:39,993] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 92 +17: [2023-05-13 03:28:39,993] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 143 +12: [2023-05-13 03:28:39,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt. +12: [2023-05-13 03:28:39,994] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 96 +18: [2023-05-13 03:28:39,996] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 151 +12: [2023-05-13 03:28:39,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt. +26: [2023-05-13 03:28:39,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt. +26: [2023-05-13 03:28:39,997] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 209 +12: [2023-05-13 03:28:39,997] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 101 +12: [2023-05-13 03:28:39,998] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 98 +17: [2023-05-13 03:28:39,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:40,000] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 142 +11: [2023-05-13 03:28:40,000] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 92 +12: [2023-05-13 03:28:40,001] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 96 +23: [2023-05-13 03:28:40,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:40,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt. +23: [2023-05-13 03:28:40,001] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 185 +23: [2023-05-13 03:28:40,001] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 191 + 4: [2023-05-13 03:28:40,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt. + 4: [2023-05-13 03:28:40,002] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 38 +12: [2023-05-13 03:28:40,003] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 101 +26: [2023-05-13 03:28:40,003] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 209 +17: [2023-05-13 03:28:40,005] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 142 +23: [2023-05-13 03:28:40,006] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 191 +23: [2023-05-13 03:28:40,006] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 185 +26: [2023-05-13 03:28:40,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:40,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt. +26: [2023-05-13 03:28:40,008] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 215 + 4: [2023-05-13 03:28:40,008] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 38 + 4: [2023-05-13 03:28:40,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:40,008] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 139 + 4: [2023-05-13 03:28:40,009] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 37 + 4: [2023-05-13 03:28:40,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt. + 4: [2023-05-13 03:28:40,010] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 34 + 6: [2023-05-13 03:28:40,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt. + 1: [2023-05-13 03:28:40,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:40,011] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 52 + 1: [2023-05-13 03:28:40,011] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 9 +26: [2023-05-13 03:28:40,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:40,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt. +31: [2023-05-13 03:28:40,012] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 254 +26: [2023-05-13 03:28:40,012] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 210 +26: [2023-05-13 03:28:40,013] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 215 + 4: [2023-05-13 03:28:40,013] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 37 +17: [2023-05-13 03:28:40,013] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 139 +25: [2023-05-13 03:28:40,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:40,015] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 206 + 4: [2023-05-13 03:28:40,016] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 34 +31: [2023-05-13 03:28:40,016] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 254 + 1: [2023-05-13 03:28:40,016] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 9 +26: [2023-05-13 03:28:40,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 210 + 6: [2023-05-13 03:28:40,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 52 +20: [2023-05-13 03:28:40,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt. +20: [2023-05-13 03:28:40,019] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 167 +24: [2023-05-13 03:28:40,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt. +24: [2023-05-13 03:28:40,019] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 197 +25: [2023-05-13 03:28:40,021] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 206 +20: [2023-05-13 03:28:40,024] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 167 +24: [2023-05-13 03:28:40,024] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 197 + 8: [2023-05-13 03:28:40,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:40,026] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 71 + 8: [2023-05-13 03:28:40,030] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 71 +17: [2023-05-13 03:28:40,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:40,033] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 141 +20: [2023-05-13 03:28:40,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:40,038] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 141 +20: [2023-05-13 03:28:40,038] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 165 + 8: [2023-05-13 03:28:40,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt. + 8: [2023-05-13 03:28:40,040] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 70 +20: [2023-05-13 03:28:40,044] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 165 + 8: [2023-05-13 03:28:40,045] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 70 +17: [2023-05-13 03:28:40,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt. +17: [2023-05-13 03:28:40,046] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 138 + 4: [2023-05-13 03:28:40,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt. + 4: [2023-05-13 03:28:40,049] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 35 +17: [2023-05-13 03:28:40,051] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 138 +24: [2023-05-13 03:28:40,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt. +24: [2023-05-13 03:28:40,051] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 198 + 4: [2023-05-13 03:28:40,054] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 35 +24: [2023-05-13 03:28:40,056] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 198 +20: [2023-05-13 03:28:40,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt. +20: [2023-05-13 03:28:40,070] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 166 +24: [2023-05-13 03:28:40,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt. +24: [2023-05-13 03:28:40,074] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 193 +20: [2023-05-13 03:28:40,075] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 166 +24: [2023-05-13 03:28:40,079] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 193 +22: [2023-05-13 03:28:40,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:40,080] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 183 +22: [2023-05-13 03:28:40,086] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 183 + 4: [2023-05-13 03:28:40,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt. + 4: [2023-05-13 03:28:40,100] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 36 + 4: [2023-05-13 03:28:40,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt. + 4: [2023-05-13 03:28:40,103] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 39 + 4: [2023-05-13 03:28:40,105] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 36 + 4: [2023-05-13 03:28:40,108] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 39 + 2: [2023-05-13 03:28:40,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt. + 2: [2023-05-13 03:28:40,110] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 19 + 2: [2023-05-13 03:28:40,116] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 19 +20: [2023-05-13 03:28:40,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt. +20: [2023-05-13 03:28:40,124] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 162 +20: [2023-05-13 03:28:40,132] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 162 +24: [2023-05-13 03:28:40,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt. +24: [2023-05-13 03:28:40,139] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 194 +24: [2023-05-13 03:28:40,144] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 194 +20: [2023-05-13 03:28:40,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt. +20: [2023-05-13 03:28:40,148] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 163 +20: [2023-05-13 03:28:40,154] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 163 +20: [2023-05-13 03:28:40,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt. +20: [2023-05-13 03:28:40,155] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 160 +20: [2023-05-13 03:28:40,160] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 160 +27: [2023-05-13 03:28:40,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt. +27: [2023-05-13 03:28:40,213] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 223 +27: [2023-05-13 03:28:40,219] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 223 + 9: [2023-05-13 03:28:40,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt. + 9: [2023-05-13 03:28:40,290] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 76 + 9: [2023-05-13 03:28:40,295] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 76 +29: [2023-05-13 03:28:40,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt. +29: [2023-05-13 03:28:40,553] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 232 +29: [2023-05-13 03:28:40,559] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 232 +16: [2023-05-13 03:28:40,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:40,569] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 134 +16: [2023-05-13 03:28:40,573] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 134 +16: [2023-05-13 03:28:40,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt. +16: [2023-05-13 03:28:40,590] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 128 +16: [2023-05-13 03:28:40,595] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 128 +25: [2023-05-13 03:28:40,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:40,640] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 201 +25: [2023-05-13 03:28:40,644] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 201 +12: [2023-05-13 03:28:40,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt. +12: [2023-05-13 03:28:40,702] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 97 +12: [2023-05-13 03:28:40,707] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 97 +22: [2023-05-13 03:28:40,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:40,840] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 180 +22: [2023-05-13 03:28:40,845] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 180 + 6: [2023-05-13 03:28:40,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt. + 6: [2023-05-13 03:28:40,944] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 48 + 6: [2023-05-13 03:28:40,951] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 48 +21: [2023-05-13 03:28:40,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt. +21: [2023-05-13 03:28:40,981] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 169 +21: [2023-05-13 03:28:40,987] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 169 +22: [2023-05-13 03:28:41,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt. +22: [2023-05-13 03:28:41,106] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 176 +22: [2023-05-13 03:28:41,111] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 176 +25: [2023-05-13 03:28:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt. +25: [2023-05-13 03:28:41,161] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 202 +25: [2023-05-13 03:28:41,166] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 202 + 4: [2023-05-13 03:28:41,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt. + 4: [2023-05-13 03:28:41,490] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 33 + 4: [2023-05-13 03:28:41,495] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 33 +18: [2023-05-13 03:28:41,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt. +18: [2023-05-13 03:28:41,553] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 146 +18: [2023-05-13 03:28:41,557] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 146 +18: [2023-05-13 03:28:42,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt. +18: [2023-05-13 03:28:42,135] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 150 +18: [2023-05-13 03:28:42,140] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 150 +29: [2023-05-13 03:28:42,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25/global_step52452/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt. +29: [2023-05-13 03:28:42,271] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 256 ZeRO state_dicts for rank 235 +29: [2023-05-13 03:28:42,276] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 256 zero partition checkpoints for rank 235 + 0: successfully loaded checkpoint from lm1-2b8-55b-c4-repetitions/perplexity25 at iteration 0 +31: time (ms) | load-checkpoint: 22933.80 + 0: estimated model parameters: 2.80902656 + 0: estimated model parameters without embeddings: 2.67500544 + 0: [after model, optimizer, and learning rate scheduler are built] datetime: 2023-05-13 03:28:43 + 0: > building train, validation, and test datasets ... + 0: > datasets target sizes (minimum size): + 0: train: 1 + 0: validation: 51200 + 0: test: 51200 + 0: > building train, validation, and test datasets for GPT ... + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.053807 seconds + 0: number of documents: 3133972 + 0: > dataset split: + 0: train: + 0: document indices in [0, 3133972) total of 3133972 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_1B5_text_document_train_indexmap_1ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.139 seconds + 0: total number of samples: 731002 + 0: total number of epochs: 1 + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.106472 seconds + 0: number of documents: 364608 + 0: > dataset split: + 0: validation: + 0: document indices in [0, 364608) total of 364608 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.103 seconds + 0: total number of samples: 84978 + 0: total number of epochs: 1 + 0: > finished creating GPT datasets ... + 0: [after dataloaders are built] datetime: 2023-05-13 03:29:05 + 0: done with setup ... + 0: training ... +31: time (ms) | model-and-optimizer-setup: 58877.48 | train/valid/test-data-iterators-setup: 21727.31 + 0: [after training is done] datetime: 2023-05-13 03:29:05 +31: ----------------------------------------------------------------------------------------------------------------- +31: validation loss at the end of training for val data | lm loss value: 2.740080E+00 | lm loss PPL: 1.548822E+01 | +31: ----------------------------------------------------------------------------------------------------------------- +END 3510097: Sat 13 May 2023 03:30:02 AM EEST