gluonnlp == 1251d0501a6c8bb4b4aabac7a5410d3c94ccb82f mxnet == bd39153eaf94e7fbe1aa6fa092e0781a5d6ca25d INFO:root:Namespace(accumulate=2, batch_size=16, batch_size_eval=8, by_token=False, ckpt_dir='/home/ubuntu/ckpt-master/', ckpt_interval=5000, data='/home/ubuntu/book-enwiki/*/*/*.npz', data_eval=None, dataset_name='book_corpus_wiki_en_uncased', do_eval=False, do_training=True, dtype='float16', gpus='0,1,2,3,4,5,6,7', kvstore='device_sync', log_interval=250, lr=0.0001, num_buckets=10, num_steps=1000000, pretrained=False, profile=False, seed=0, start_step=0, verbose=False, warmup_ratio=0.01) [18:30:24] src/kvstore/././comm_tree.h:356: only 32 out of 56 GPU pairs are enabled direct access. It may affect the performance. You can set MXNET_ENABLE_GPU_P2P=0 to turn it off [18:30:24] src/kvstore/././comm_tree.h:365: .vvvv... [18:30:24] src/kvstore/././comm_tree.h:365: v.vv.v.. [18:30:24] src/kvstore/././comm_tree.h:365: vv.v..v. [18:30:24] src/kvstore/././comm_tree.h:365: vvv....v [18:30:24] src/kvstore/././comm_tree.h:365: v....vvv [18:30:24] src/kvstore/././comm_tree.h:365: .v..v.vv [18:30:24] src/kvstore/././comm_tree.h:365: ..v.vv.v [18:30:24] src/kvstore/././comm_tree.h:365: ...vvvv. [18:30:24] src/kvstore/./././gpu_topology.h:216: cudaDeviceGetP2PAttribute incorrect. Falling back to cudaDeviceEnablePeerAccess for topology detection [18:30:24] src/kvstore/././comm_tree.h:380: Using Kernighan-Lin to generate trees [18:30:24] src/kvstore/././comm_tree.h:391: Using Tree [18:30:26] src/kvstore/././comm_tree.h:488: Size 2 occurs 1 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 768 occurs 114 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 1536 occurs 2 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 3072 occurs 12 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 30522 occurs 1 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 393216 occurs 1 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 589824 occurs 50 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 2359296 occurs 24 times [18:30:26] src/kvstore/././comm_tree.h:488: Size 23440896 occurs 1 times INFO:root:overflow detected. set loss_scale = 16384.0 INFO:root:overflow detected. set loss_scale = 8192.0 INFO:root:overflow detected. set loss_scale = 4096.0 INFO:root:overflow detected. set loss_scale = 2048.0 INFO:root:overflow detected. set loss_scale = 1024.0 INFO:root:[step 249] mlm_loss=9.24962 mlm_acc=5.01887 nsp_loss=0.68673 nsp_acc=54.751 throughput=122.0K tks/s lr=0.0000025 time=163.24 INFO:root:[step 499] mlm_loss=8.19401 mlm_acc=6.20519 nsp_loss=0.68434 nsp_acc=55.795 throughput=124.0K tks/s lr=0.0000050 time=108.43 INFO:root:[step 749] mlm_loss=7.33075 mlm_acc=8.23712 nsp_loss=0.68531 nsp_acc=54.452 throughput=140.0K tks/s lr=0.0000075 time=140.77 INFO:root:[step 999] mlm_loss=7.10765 mlm_acc=9.11098 nsp_loss=0.65776 nsp_acc=58.997 throughput=127.0K tks/s lr=0.0000100 time=113.12 INFO:root:[step 1249] mlm_loss=7.02303 mlm_acc=9.54828 nsp_loss=0.61480 nsp_acc=63.509 throughput=123.0K tks/s lr=0.0000125 time=120.87 INFO:root:[step 1499] mlm_loss=6.94200 mlm_acc=10.12084 nsp_loss=0.61056 nsp_acc=63.813 throughput=140.0K tks/s lr=0.0000150 time=122.08 INFO:root:[step 1749] mlm_loss=6.60900 mlm_acc=11.67967 nsp_loss=0.62407 nsp_acc=61.016 throughput=150.0K tks/s lr=0.0000175 time=157.78 INFO:root:[step 1999] mlm_loss=6.66644 mlm_acc=11.80617 nsp_loss=0.63280 nsp_acc=61.529 throughput=151.0K tks/s lr=0.0000200 time=149.24 INFO:root:[step 2249] mlm_loss=6.81814 mlm_acc=11.68211 nsp_loss=0.58774 nsp_acc=66.839 throughput=134.0K tks/s lr=0.0000225 time=135.36 INFO:root:[step 2499] mlm_loss=6.66386 mlm_acc=12.34327 nsp_loss=0.53046 nsp_acc=71.784 throughput=120.0K tks/s lr=0.0000250 time=106.67 INFO:root:[step 2749] mlm_loss=6.70937 mlm_acc=12.59501 nsp_loss=0.51380 nsp_acc=73.518 throughput=124.0K tks/s lr=0.0000275 time=110.49 INFO:root:[step 2999] mlm_loss=6.56966 mlm_acc=13.05192 nsp_loss=0.47944 nsp_acc=75.961 throughput=111.0K tks/s lr=0.0000300 time=118.18 INFO:root:[step 3249] mlm_loss=6.58960 mlm_acc=13.09013 nsp_loss=0.49284 nsp_acc=74.973 throughput=138.0K tks/s lr=0.0000325 time=117.46 INFO:root:[step 3499] mlm_loss=6.58534 mlm_acc=13.25706 nsp_loss=0.46531 nsp_acc=77.106 throughput=131.0K tks/s lr=0.0000350 time=130.38 INFO:root:[step 3749] mlm_loss=6.28094 mlm_acc=13.71884 nsp_loss=0.51207 nsp_acc=73.258 throughput=144.0K tks/s lr=0.0000375 time=143.71 INFO:root:[step 3999] mlm_loss=6.24885 mlm_acc=13.85473 nsp_loss=0.50803 nsp_acc=72.861 throughput=152.0K tks/s lr=0.0000400 time=147.59 INFO:root:[step 4249] mlm_loss=6.37051 mlm_acc=13.99126 nsp_loss=0.42434 nsp_acc=79.779 throughput=131.0K tks/s lr=0.0000425 time=129.17 INFO:root:[step 4499] mlm_loss=6.33056 mlm_acc=13.96524 nsp_loss=0.40867 nsp_acc=80.454 throughput=131.0K tks/s lr=0.0000450 time=136.79 INFO:root:[step 4749] mlm_loss=6.44407 mlm_acc=13.91319 nsp_loss=0.37792 nsp_acc=82.457 throughput=119.0K tks/s lr=0.0000475 time=141.86 INFO:root:[step 4999] mlm_loss=6.34793 mlm_acc=14.35129 nsp_loss=0.34620 nsp_acc=84.570 throughput=116.0K tks/s lr=0.0000500 time=126.67 INFO:root:[step 4999] Saving checkpoints to /home/ubuntu/ckpt-master/0004999.params, /home/ubuntu/ckpt-master/0004999.states. INFO:root:[step 5249] mlm_loss=6.10379 mlm_acc=14.57130 nsp_loss=0.42890 nsp_acc=78.174 throughput=119.0K tks/s lr=0.0000525 time=165.80 INFO:root:[step 5499] mlm_loss=6.17369 mlm_acc=14.70321 nsp_loss=0.41912 nsp_acc=79.347 throughput=136.0K tks/s lr=0.0000550 time=144.45 INFO:root:[step 5749] mlm_loss=6.32352 mlm_acc=14.66357 nsp_loss=0.31973 nsp_acc=85.963 throughput=126.0K tks/s lr=0.0000575 time=121.34 INFO:root:[step 5999] mlm_loss=6.35760 mlm_acc=14.48697 nsp_loss=0.33205 nsp_acc=85.537 throughput=134.0K tks/s lr=0.0000600 time=140.98 INFO:root:overflow detected. set loss_scale = 512.0 INFO:root:[step 6249] mlm_loss=6.35097 mlm_acc=14.49889 nsp_loss=0.33935 nsp_acc=84.923 throughput=141.0K tks/s lr=0.0000625 time=152.52 INFO:root:[step 6499] mlm_loss=5.83697 mlm_acc=15.30754 nsp_loss=0.39578 nsp_acc=80.854 throughput=139.0K tks/s lr=0.0000650 time=127.93 INFO:root:[step 6749] mlm_loss=6.03047 mlm_acc=15.07474 nsp_loss=0.39430 nsp_acc=80.884 throughput=146.0K tks/s lr=0.0000675 time=148.27 INFO:root:[step 6999] mlm_loss=6.25431 mlm_acc=14.91075 nsp_loss=0.31190 nsp_acc=86.314 throughput=141.0K tks/s lr=0.0000700 time=144.82 INFO:root:[step 7249] mlm_loss=6.26756 mlm_acc=15.06087 nsp_loss=0.28475 nsp_acc=87.829 throughput=142.0K tks/s lr=0.0000725 time=153.33 INFO:root:[step 7499] mlm_loss=6.07040 mlm_acc=15.72072 nsp_loss=0.26277 nsp_acc=88.871 throughput=129.0K tks/s lr=0.0000750 time=115.97 INFO:root:[step 7749] mlm_loss=5.88694 mlm_acc=15.76536 nsp_loss=0.40010 nsp_acc=80.387 throughput=143.0K tks/s lr=0.0000775 time=137.06 INFO:root:[step 7999] mlm_loss=5.89273 mlm_acc=15.77247 nsp_loss=0.38653 nsp_acc=81.270 throughput=152.0K tks/s lr=0.0000800 time=153.08 INFO:root:[step 8249] mlm_loss=5.96746 mlm_acc=15.65581 nsp_loss=0.40057 nsp_acc=80.791 throughput=147.0K tks/s lr=0.0000825 time=158.42 INFO:root:[step 8499] mlm_loss=5.61746 mlm_acc=17.52625 nsp_loss=0.29400 nsp_acc=86.866 throughput=133.0K tks/s lr=0.0000850 time=124.48 INFO:root:[step 8749] mlm_loss=5.64756 mlm_acc=18.43149 nsp_loss=0.23252 nsp_acc=90.495 throughput=115.0K tks/s lr=0.0000875 time=117.50 INFO:root:[step 8999] mlm_loss=5.77620 mlm_acc=18.76604 nsp_loss=0.24259 nsp_acc=90.038 throughput=141.0K tks/s lr=0.0000900 time=125.06 INFO:root:[step 9249] mlm_loss=5.29787 mlm_acc=21.28720 nsp_loss=0.44799 nsp_acc=77.831 throughput=150.0K tks/s lr=0.0000925 time=168.44 INFO:root:[step 9499] mlm_loss=4.91604 mlm_acc=24.65914 nsp_loss=0.35247 nsp_acc=83.277 throughput=135.0K tks/s lr=0.0000950 time=134.32 INFO:root:[step 9749] mlm_loss=4.97408 mlm_acc=25.54348 nsp_loss=0.22094 nsp_acc=90.867 throughput=121.0K tks/s lr=0.0000975 time=118.98 INFO:root:[step 9999] mlm_loss=4.74977 mlm_acc=28.34388 nsp_loss=0.20558 nsp_acc=91.594 throughput=129.0K tks/s lr=0.0001000 time=114.67 INFO:root:[step 9999] Saving checkpoints to /home/ubuntu/ckpt-master/0009999.params, /home/ubuntu/ckpt-master/0009999.states. INFO:root:[step 10249] mlm_loss=4.69173 mlm_acc=28.45913 nsp_loss=0.25481 nsp_acc=88.965 throughput=118.0K tks/s lr=0.0000990 time=172.79 INFO:root:[step 10499] mlm_loss=3.88145 mlm_acc=33.41813 nsp_loss=0.23316 nsp_acc=90.071 throughput=128.0K tks/s lr=0.0000990 time=114.16 INFO:root:[step 10749] mlm_loss=4.21782 mlm_acc=32.81286 nsp_loss=0.23693 nsp_acc=89.780 throughput=130.0K tks/s lr=0.0000989 time=131.53 INFO:root:[step 10999] mlm_loss=4.05470 mlm_acc=33.45309 nsp_loss=0.34097 nsp_acc=84.033 throughput=145.0K tks/s lr=0.0000989 time=150.24 INFO:root:[step 11249] mlm_loss=4.42531 mlm_acc=31.94107 nsp_loss=0.15972 nsp_acc=93.588 throughput=136.0K tks/s lr=0.0000989 time=137.28 INFO:root:[step 11499] mlm_loss=3.92384 mlm_acc=35.34821 nsp_loss=0.26810 nsp_acc=87.407 throughput=145.0K tks/s lr=0.0000989 time=133.21 INFO:root:[step 11749] mlm_loss=3.95973 mlm_acc=35.69644 nsp_loss=0.14502 nsp_acc=94.074 throughput=111.0K tks/s lr=0.0000988 time=120.91 INFO:root:[step 11999] mlm_loss=3.96150 mlm_acc=36.19118 nsp_loss=0.17180 nsp_acc=92.883 throughput=140.0K tks/s lr=0.0000988 time=136.68 INFO:root:[step 12249] mlm_loss=3.80372 mlm_acc=37.85625 nsp_loss=0.20134 nsp_acc=91.446 throughput=140.0K tks/s lr=0.0000988 time=144.05 INFO:root:[step 12499] mlm_loss=3.60721 mlm_acc=39.81622 nsp_loss=0.12610 nsp_acc=94.919 throughput=121.0K tks/s lr=0.0000988 time=110.30 INFO:root:[step 12749] mlm_loss=3.74572 mlm_acc=39.60535 nsp_loss=0.12794 nsp_acc=94.860 throughput=127.0K tks/s lr=0.0000987 time=127.47 INFO:root:[step 12999] mlm_loss=3.38575 mlm_acc=41.28279 nsp_loss=0.16747 nsp_acc=92.870 throughput=137.0K tks/s lr=0.0000987 time=117.16 INFO:root:[step 13249] mlm_loss=3.71028 mlm_acc=39.44776 nsp_loss=0.18743 nsp_acc=91.896 throughput=153.0K tks/s lr=0.0000987 time=154.33 INFO:root:[step 13499] mlm_loss=3.42893 mlm_acc=41.18944 nsp_loss=0.14715 nsp_acc=94.001 throughput=134.0K tks/s lr=0.0000987 time=135.18 INFO:root:[step 13749] mlm_loss=3.30540 mlm_acc=41.49550 nsp_loss=0.27671 nsp_acc=86.875 throughput=146.0K tks/s lr=0.0000986 time=159.52 INFO:root:[step 13999] mlm_loss=3.18660 mlm_acc=43.17579 nsp_loss=0.17868 nsp_acc=92.203 throughput=134.0K tks/s lr=0.0000986 time=127.80 INFO:root:[step 14249] mlm_loss=3.26912 mlm_acc=43.85207 nsp_loss=0.11158 nsp_acc=95.544 throughput=113.0K tks/s lr=0.0000986 time=118.93 INFO:root:[step 14499] mlm_loss=3.15502 mlm_acc=44.98965 nsp_loss=0.10874 nsp_acc=95.732 throughput=119.0K tks/s lr=0.0000986 time=110.68 INFO:root:[step 14749] mlm_loss=3.17752 mlm_acc=45.47977 nsp_loss=0.11401 nsp_acc=95.455 throughput=125.0K tks/s lr=0.0000985 time=110.70 INFO:root:[step 14999] mlm_loss=3.43249 mlm_acc=43.82970 nsp_loss=0.10487 nsp_acc=95.786 throughput=138.0K tks/s lr=0.0000985 time=135.45 INFO:root:[step 14999] Saving checkpoints to /home/ubuntu/ckpt-master/0014999.params, /home/ubuntu/ckpt-master/0014999.states. INFO:root:[step 15249] mlm_loss=2.79499 mlm_acc=48.08410 nsp_loss=0.10587 nsp_acc=95.945 throughput=92.0K tks/s lr=0.0000985 time=124.93 INFO:root:[step 15499] mlm_loss=3.13775 mlm_acc=45.79923 nsp_loss=0.10704 nsp_acc=95.824 throughput=120.0K tks/s lr=0.0000985 time=125.66 INFO:root:[step 15749] mlm_loss=3.20607 mlm_acc=44.06169 nsp_loss=0.17094 nsp_acc=92.692 throughput=141.0K tks/s lr=0.0000984 time=140.64 INFO:root:[step 15999] mlm_loss=3.07678 mlm_acc=46.77482 nsp_loss=0.10412 nsp_acc=95.784 throughput=124.0K tks/s lr=0.0000984 time=117.60 INFO:root:[step 16249] mlm_loss=3.20485 mlm_acc=42.99788 nsp_loss=0.17287 nsp_acc=92.881 throughput=154.0K tks/s lr=0.0000984 time=154.49 INFO:root:[step 16499] mlm_loss=3.00407 mlm_acc=46.85820 nsp_loss=0.10287 nsp_acc=96.074 throughput=117.0K tks/s lr=0.0000984 time=123.06 INFO:root:[step 16749] mlm_loss=3.19774 mlm_acc=44.98059 nsp_loss=0.12299 nsp_acc=95.050 throughput=147.0K tks/s lr=0.0000983 time=143.65 INFO:root:[step 16999] mlm_loss=3.12970 mlm_acc=45.24535 nsp_loss=0.14812 nsp_acc=93.849 throughput=156.0K tks/s lr=0.0000983 time=159.04 INFO:root:[step 17249] mlm_loss=2.92400 mlm_acc=47.91387 nsp_loss=0.11004 nsp_acc=95.652 throughput=114.0K tks/s lr=0.0000983 time=122.47 INFO:root:[step 17499] mlm_loss=3.04736 mlm_acc=47.23758 nsp_loss=0.09463 nsp_acc=96.357 throughput=136.0K tks/s lr=0.0000983 time=120.17 INFO:root:[step 17749] mlm_loss=2.95884 mlm_acc=45.87974 nsp_loss=0.23316 nsp_acc=89.596 throughput=146.0K tks/s lr=0.0000982 time=162.15 INFO:root:[step 17999] mlm_loss=2.92234 mlm_acc=48.24828 nsp_loss=0.09977 nsp_acc=96.044 throughput=130.0K tks/s lr=0.0000982 time=110.75 INFO:root:[step 18249] mlm_loss=3.14746 mlm_acc=46.47178 nsp_loss=0.13876 nsp_acc=94.071 throughput=142.0K tks/s lr=0.0000982 time=136.91 INFO:root:[step 18499] mlm_loss=3.09619 mlm_acc=45.15179 nsp_loss=0.20924 nsp_acc=90.884 throughput=144.0K tks/s lr=0.0000982 time=150.10 INFO:root:[step 18749] mlm_loss=3.02326 mlm_acc=46.44832 nsp_loss=0.11910 nsp_acc=95.144 throughput=127.0K tks/s lr=0.0000981 time=116.25 INFO:root:[step 18999] mlm_loss=2.79279 mlm_acc=49.62597 nsp_loss=0.09835 nsp_acc=96.123 throughput=114.0K tks/s lr=0.0000981 time=116.99 INFO:root:[step 19249] mlm_loss=2.98351 mlm_acc=48.19634 nsp_loss=0.09614 nsp_acc=96.216 throughput=135.0K tks/s lr=0.0000981 time=116.11 INFO:root:[step 19499] mlm_loss=2.94957 mlm_acc=47.02392 nsp_loss=0.13354 nsp_acc=94.499 throughput=143.0K tks/s lr=0.0000981 time=141.00 INFO:root:[step 19749] mlm_loss=2.67584 mlm_acc=50.73501 nsp_loss=0.08902 nsp_acc=96.529 throughput=114.0K tks/s lr=0.0000980 time=112.65 INFO:root:[step 19999] mlm_loss=2.90303 mlm_acc=48.57758 nsp_loss=0.09145 nsp_acc=96.416 throughput=139.0K tks/s lr=0.0000980 time=123.54 INFO:root:[step 19999] Saving checkpoints to /home/ubuntu/ckpt-master/0019999.params, /home/ubuntu/ckpt-master/0019999.states. INFO:root:[step 20249] mlm_loss=3.02376 mlm_acc=46.32201 nsp_loss=0.10981 nsp_acc=95.607 throughput=129.0K tks/s lr=0.0000980 time=159.01 INFO:root:[step 20499] mlm_loss=2.82755 mlm_acc=49.50975 nsp_loss=0.09966 nsp_acc=96.100 throughput=125.0K tks/s lr=0.0000980 time=127.08 INFO:root:[step 20749] mlm_loss=2.77075 mlm_acc=49.86758 nsp_loss=0.09059 nsp_acc=96.479 throughput=127.0K tks/s lr=0.0000979 time=111.23 INFO:root:[step 20999] mlm_loss=2.95397 mlm_acc=49.00948 nsp_loss=0.09002 nsp_acc=96.455 throughput=132.0K tks/s lr=0.0000979 time=128.29 INFO:root:[step 21249] mlm_loss=2.63477 mlm_acc=51.24469 nsp_loss=0.08909 nsp_acc=96.595 throughput=121.0K tks/s lr=0.0000979 time=108.39 INFO:root:[step 21499] mlm_loss=2.47106 mlm_acc=52.32215 nsp_loss=0.08694 nsp_acc=96.705 throughput=105.0K tks/s lr=0.0000979 time=115.97 INFO:root:[step 21749] mlm_loss=2.77182 mlm_acc=47.80118 nsp_loss=0.13010 nsp_acc=94.692 throughput=145.0K tks/s lr=0.0000978 time=125.31 INFO:root:[step 21999] mlm_loss=2.97440 mlm_acc=47.04771 nsp_loss=0.14011 nsp_acc=94.017 throughput=146.0K tks/s lr=0.0000978 time=144.29 INFO:root:[step 22249] mlm_loss=2.84819 mlm_acc=49.75539 nsp_loss=0.08506 nsp_acc=96.659 throughput=132.0K tks/s lr=0.0000978 time=131.08 INFO:root:[step 22499] mlm_loss=2.47991 mlm_acc=51.63803 nsp_loss=0.09898 nsp_acc=96.102 throughput=110.0K tks/s lr=0.0000978 time=107.52 INFO:root:[step 22749] mlm_loss=2.45411 mlm_acc=52.53032 nsp_loss=0.08889 nsp_acc=96.567 throughput=107.0K tks/s lr=0.0000977 time=115.97 INFO:root:[step 22999] mlm_loss=2.60504 mlm_acc=51.65700 nsp_loss=0.09705 nsp_acc=96.175 throughput=119.0K tks/s lr=0.0000977 time=108.24 INFO:root:[step 23249] mlm_loss=2.63496 mlm_acc=51.61097 nsp_loss=0.08503 nsp_acc=96.671 throughput=126.0K tks/s lr=0.0000977 time=110.59 INFO:root:[step 23499] mlm_loss=2.57153 mlm_acc=51.71020 nsp_loss=0.08730 nsp_acc=96.626 throughput=110.0K tks/s lr=0.0000977 time=122.39 INFO:root:[step 23749] mlm_loss=2.67650 mlm_acc=48.89553 nsp_loss=0.12377 nsp_acc=94.982 throughput=144.0K tks/s lr=0.0000976 time=129.53 INFO:root:[step 23999] mlm_loss=2.57794 mlm_acc=49.69146 nsp_loss=0.13747 nsp_acc=94.375 throughput=134.0K tks/s lr=0.0000976 time=134.52 INFO:root:[step 24249] mlm_loss=2.56224 mlm_acc=53.37231 nsp_loss=0.17289 nsp_acc=92.925 throughput=150.0K tks/s lr=0.0000976 time=150.24 INFO:root:[step 24499] mlm_loss=2.93617 mlm_acc=48.25845 nsp_loss=0.12211 nsp_acc=94.992 throughput=148.0K tks/s lr=0.0000976 time=160.10 INFO:root:[step 24749] mlm_loss=2.68284 mlm_acc=51.26631 nsp_loss=0.08140 nsp_acc=96.835 throughput=134.0K tks/s lr=0.0000975 time=120.28 INFO:root:[step 24999] mlm_loss=2.51830 mlm_acc=52.75433 nsp_loss=0.08509 nsp_acc=96.704 throughput=116.0K tks/s lr=0.0000975 time=115.97 INFO:root:[step 24999] Saving checkpoints to /home/ubuntu/ckpt-master/0024999.params, /home/ubuntu/ckpt-master/0024999.states. INFO:root:[step 25249] mlm_loss=2.63802 mlm_acc=51.82565 nsp_loss=0.08219 nsp_acc=96.838 throughput=109.0K tks/s lr=0.0000975 time=135.98 INFO:root:[step 25499] mlm_loss=2.67416 mlm_acc=50.48222 nsp_loss=0.17588 nsp_acc=92.351 throughput=136.0K tks/s lr=0.0000975 time=136.84 INFO:root:[step 25749] mlm_loss=2.74081 mlm_acc=50.73164 nsp_loss=0.08344 nsp_acc=96.790 throughput=135.0K tks/s lr=0.0000974 time=132.96 INFO:root:[step 25999] mlm_loss=2.49793 mlm_acc=52.98010 nsp_loss=0.08179 nsp_acc=96.981 throughput=124.0K tks/s lr=0.0000974 time=111.73 INFO:root:[step 26249] mlm_loss=2.72292 mlm_acc=49.58928 nsp_loss=0.12862 nsp_acc=94.613 throughput=152.0K tks/s lr=0.0000974 time=148.76 INFO:root:[step 26499] mlm_loss=2.62275 mlm_acc=52.03870 nsp_loss=0.08473 nsp_acc=96.716 throughput=124.0K tks/s lr=0.0000974 time=127.01 INFO:root:[step 26749] mlm_loss=2.58009 mlm_acc=52.44536 nsp_loss=0.08366 nsp_acc=96.815 throughput=132.0K tks/s lr=0.0000973 time=112.73 INFO:root:[step 26999] mlm_loss=2.81359 mlm_acc=48.31377 nsp_loss=0.15767 nsp_acc=93.324 throughput=146.0K tks/s lr=0.0000973 time=161.93 INFO:root:[step 27249] mlm_loss=2.48337 mlm_acc=53.17681 nsp_loss=0.08081 nsp_acc=96.915 throughput=124.0K tks/s lr=0.0000973 time=109.23 INFO:root:[step 27499] mlm_loss=2.71858 mlm_acc=51.31392 nsp_loss=0.08187 nsp_acc=96.809 throughput=140.0K tks/s lr=0.0000973 time=133.59 INFO:root:[step 27749] mlm_loss=2.64182 mlm_acc=50.85505 nsp_loss=0.17476 nsp_acc=92.275 throughput=140.0K tks/s lr=0.0000972 time=138.78 INFO:root:[step 27999] mlm_loss=2.67642 mlm_acc=50.44847 nsp_loss=0.10089 nsp_acc=95.959 throughput=146.0K tks/s lr=0.0000972 time=143.01 INFO:root:[step 28249] mlm_loss=2.48491 mlm_acc=52.96541 nsp_loss=0.07990 nsp_acc=97.027 throughput=130.0K tks/s lr=0.0000972 time=118.59 INFO:root:[step 28499] mlm_loss=2.74263 mlm_acc=51.62462 nsp_loss=0.08258 nsp_acc=96.808 throughput=139.0K tks/s lr=0.0000972 time=135.08 INFO:root:[step 28749] mlm_loss=2.54885 mlm_acc=52.80457 nsp_loss=0.08302 nsp_acc=96.775 throughput=121.0K tks/s lr=0.0000971 time=123.16 INFO:root:[step 28999] mlm_loss=2.51579 mlm_acc=53.00553 nsp_loss=0.08172 nsp_acc=96.909 throughput=130.0K tks/s lr=0.0000971 time=116.20 INFO:root:[step 29249] mlm_loss=2.63260 mlm_acc=52.45491 nsp_loss=0.07841 nsp_acc=96.965 throughput=130.0K tks/s lr=0.0000971 time=128.49 INFO:root:[step 29499] mlm_loss=2.61169 mlm_acc=52.16152 nsp_loss=0.07968 nsp_acc=96.912 throughput=134.0K tks/s lr=0.0000971 time=130.77 INFO:root:[step 29749] mlm_loss=2.43542 mlm_acc=54.29602 nsp_loss=0.07969 nsp_acc=96.896 throughput=121.0K tks/s lr=0.0000970 time=111.43 INFO:root:[step 29999] mlm_loss=2.75124 mlm_acc=50.06272 nsp_loss=0.10914 nsp_acc=95.457 throughput=144.0K tks/s lr=0.0000970 time=142.74 INFO:root:[step 29999] Saving checkpoints to /home/ubuntu/ckpt-master/0029999.params, /home/ubuntu/ckpt-master/0029999.states. INFO:root:[step 30249] mlm_loss=2.47535 mlm_acc=51.95071 nsp_loss=0.11756 nsp_acc=95.167 throughput=115.0K tks/s lr=0.0000970 time=150.02 INFO:root:[step 30499] mlm_loss=2.48886 mlm_acc=52.87544 nsp_loss=0.11408 nsp_acc=95.249 throughput=128.0K tks/s lr=0.0000970 time=131.20 INFO:root:[step 30749] mlm_loss=2.55019 mlm_acc=51.98107 nsp_loss=0.13628 nsp_acc=94.381 throughput=141.0K tks/s lr=0.0000969 time=125.19 INFO:root:[step 30999] mlm_loss=2.59380 mlm_acc=51.87783 nsp_loss=0.14796 nsp_acc=93.754 throughput=144.0K tks/s lr=0.0000969 time=140.80 INFO:root:[step 31249] mlm_loss=2.57384 mlm_acc=51.73675 nsp_loss=0.12306 nsp_acc=94.903 throughput=148.0K tks/s lr=0.0000969 time=146.24 INFO:root:[step 31499] mlm_loss=2.63179 mlm_acc=51.57494 nsp_loss=0.12039 nsp_acc=94.854 throughput=142.0K tks/s lr=0.0000969 time=136.61 INFO:root:[step 31749] mlm_loss=2.76106 mlm_acc=48.60183 nsp_loss=0.15465 nsp_acc=93.526 throughput=149.0K tks/s lr=0.0000968 time=166.84 INFO:root:[step 31999] mlm_loss=2.40264 mlm_acc=54.51310 nsp_loss=0.07970 nsp_acc=96.833 throughput=126.0K tks/s lr=0.0000968 time=110.56 INFO:root:[step 32249] mlm_loss=2.47634 mlm_acc=54.83684 nsp_loss=0.10455 nsp_acc=95.976 throughput=130.0K tks/s lr=0.0000968 time=126.50 INFO:root:[step 32499] mlm_loss=1.99523 mlm_acc=63.61844 nsp_loss=0.11922 nsp_acc=95.303 throughput=141.0K tks/s lr=0.0000968 time=127.12 INFO:root:[step 32749] mlm_loss=2.33889 mlm_acc=54.92948 nsp_loss=0.08650 nsp_acc=96.639 throughput=115.0K tks/s lr=0.0000967 time=119.46 INFO:root:[step 32999] mlm_loss=2.30915 mlm_acc=55.55732 nsp_loss=0.07861 nsp_acc=97.070 throughput=118.0K tks/s lr=0.0000967 time=106.53 INFO:root:[step 33249] mlm_loss=2.44475 mlm_acc=54.34965 nsp_loss=0.07861 nsp_acc=96.956 throughput=133.0K tks/s lr=0.0000967 time=114.52 INFO:root:[step 33499] mlm_loss=2.36870 mlm_acc=54.91144 nsp_loss=0.07609 nsp_acc=97.106 throughput=115.0K tks/s lr=0.0000967 time=119.52 INFO:root:[step 33749] mlm_loss=2.30416 mlm_acc=54.78583 nsp_loss=0.08961 nsp_acc=96.567 throughput=119.0K tks/s lr=0.0000966 time=110.64 INFO:root:[step 33999] mlm_loss=2.22795 mlm_acc=55.85691 nsp_loss=0.07666 nsp_acc=97.079 throughput=119.0K tks/s lr=0.0000966 time=107.92 INFO:root:[step 34249] mlm_loss=2.62342 mlm_acc=51.01186 nsp_loss=0.10364 nsp_acc=95.823 throughput=143.0K tks/s lr=0.0000966 time=157.58 INFO:root:[step 34499] mlm_loss=2.21946 mlm_acc=56.06004 nsp_loss=0.08086 nsp_acc=96.993 throughput=119.0K tks/s lr=0.0000966 time=109.53 INFO:root:[step 34749] mlm_loss=2.49114 mlm_acc=53.38293 nsp_loss=0.07516 nsp_acc=97.073 throughput=136.0K tks/s lr=0.0000965 time=132.00 INFO:root:[step 34999] mlm_loss=2.62715 mlm_acc=52.72067 nsp_loss=0.07597 nsp_acc=97.131 throughput=145.0K tks/s lr=0.0000965 time=138.74 INFO:root:[step 34999] Saving checkpoints to /home/ubuntu/ckpt-master/0034999.params, /home/ubuntu/ckpt-master/0034999.states. INFO:root:[step 35249] mlm_loss=2.56986 mlm_acc=51.77698 nsp_loss=0.09837 nsp_acc=96.071 throughput=132.0K tks/s lr=0.0000965 time=168.30 INFO:root:[step 35499] mlm_loss=2.57988 mlm_acc=52.09941 nsp_loss=0.10579 nsp_acc=95.710 throughput=150.0K tks/s lr=0.0000965 time=147.11 INFO:root:[step 35749] mlm_loss=2.60978 mlm_acc=52.05011 nsp_loss=0.19452 nsp_acc=91.174 throughput=140.0K tks/s lr=0.0000964 time=136.13 INFO:root:[step 35999] mlm_loss=2.48243 mlm_acc=53.78433 nsp_loss=0.08439 nsp_acc=96.675 throughput=134.0K tks/s lr=0.0000964 time=131.36 INFO:root:[step 36249] mlm_loss=2.30933 mlm_acc=56.67536 nsp_loss=0.12746 nsp_acc=94.893 throughput=152.0K tks/s lr=0.0000964 time=148.42 INFO:root:[step 36499] mlm_loss=2.05191 mlm_acc=62.32970 nsp_loss=0.09813 nsp_acc=96.309 throughput=133.0K tks/s lr=0.0000964 time=129.12 INFO:root:[step 36749] mlm_loss=2.48923 mlm_acc=52.81466 nsp_loss=0.14091 nsp_acc=94.022 throughput=144.0K tks/s lr=0.0000963 time=146.54 INFO:root:[step 36999] mlm_loss=2.58465 mlm_acc=51.12189 nsp_loss=0.22931 nsp_acc=89.659 throughput=144.0K tks/s lr=0.0000963 time=145.81 INFO:root:[step 37249] mlm_loss=2.24871 mlm_acc=55.70045 nsp_loss=0.08079 nsp_acc=96.962 throughput=117.0K tks/s lr=0.0000963 time=111.33 INFO:root:[step 37499] mlm_loss=2.15755 mlm_acc=56.20396 nsp_loss=0.08038 nsp_acc=96.961 throughput=123.0K tks/s lr=0.0000963 time=111.07 INFO:root:[step 37749] mlm_loss=2.48601 mlm_acc=54.67770 nsp_loss=0.07750 nsp_acc=96.933 throughput=139.0K tks/s lr=0.0000962 time=133.09 INFO:root:[step 37999] mlm_loss=2.56776 mlm_acc=52.53003 nsp_loss=0.12225 nsp_acc=94.942 throughput=151.0K tks/s lr=0.0000962 time=162.50 INFO:root:[step 38249] mlm_loss=2.56475 mlm_acc=52.66727 nsp_loss=0.11226 nsp_acc=95.468 throughput=155.0K tks/s lr=0.0000962 time=150.96 INFO:root:[step 38499] mlm_loss=2.47870 mlm_acc=53.01638 nsp_loss=0.11214 nsp_acc=95.408 throughput=146.0K tks/s lr=0.0000962 time=146.10 INFO:root:[step 38749] mlm_loss=2.12940 mlm_acc=56.52495 nsp_loss=0.07851 nsp_acc=97.062 throughput=119.0K tks/s lr=0.0000961 time=109.04 INFO:root:[step 38999] mlm_loss=2.13080 mlm_acc=57.11725 nsp_loss=0.07534 nsp_acc=97.109 throughput=114.0K tks/s lr=0.0000961 time=102.88 INFO:root:[step 39249] mlm_loss=2.47159 mlm_acc=54.42108 nsp_loss=0.07775 nsp_acc=97.026 throughput=135.0K tks/s lr=0.0000961 time=126.76 INFO:root:[step 39499] mlm_loss=2.31155 mlm_acc=55.62284 nsp_loss=0.07357 nsp_acc=97.204 throughput=121.0K tks/s lr=0.0000961 time=119.58 INFO:root:[step 39749] mlm_loss=2.44172 mlm_acc=54.60995 nsp_loss=0.07355 nsp_acc=97.096 throughput=141.0K tks/s lr=0.0000960 time=125.25 INFO:root:[step 39999] mlm_loss=2.33162 mlm_acc=55.69279 nsp_loss=0.07390 nsp_acc=97.177 throughput=120.0K tks/s lr=0.0000960 time=121.15 INFO:root:[step 39999] Saving checkpoints to /home/ubuntu/ckpt-master/0039999.params, /home/ubuntu/ckpt-master/0039999.states. INFO:root:[step 40249] mlm_loss=2.24810 mlm_acc=56.13896 nsp_loss=0.07310 nsp_acc=97.237 throughput=111.0K tks/s lr=0.0000960 time=125.74 INFO:root:[step 40499] mlm_loss=2.26530 mlm_acc=55.90365 nsp_loss=0.07367 nsp_acc=97.320 throughput=119.0K tks/s lr=0.0000960 time=115.95 INFO:root:[step 40749] mlm_loss=2.50216 mlm_acc=52.18527 nsp_loss=0.19043 nsp_acc=91.186 throughput=149.0K tks/s lr=0.0000959 time=148.28 INFO:root:[step 40999] mlm_loss=2.29877 mlm_acc=54.78348 nsp_loss=0.13527 nsp_acc=94.170 throughput=139.0K tks/s lr=0.0000959 time=123.35 INFO:root:[step 41249] mlm_loss=2.68342 mlm_acc=50.82919 nsp_loss=0.12768 nsp_acc=94.843 throughput=142.0K tks/s lr=0.0000959 time=137.90 INFO:root:[step 41499] mlm_loss=2.48272 mlm_acc=54.61306 nsp_loss=0.07366 nsp_acc=97.174 throughput=137.0K tks/s lr=0.0000959 time=133.23 INFO:root:[step 41749] mlm_loss=2.34110 mlm_acc=55.46049 nsp_loss=0.07334 nsp_acc=97.239 throughput=125.0K tks/s lr=0.0000958 time=126.65 INFO:root:[step 41999] mlm_loss=2.46696 mlm_acc=52.08039 nsp_loss=0.12228 nsp_acc=95.127 throughput=133.0K tks/s lr=0.0000958 time=119.73 INFO:root:[step 42249] mlm_loss=2.53506 mlm_acc=51.57339 nsp_loss=0.15612 nsp_acc=93.389 throughput=158.0K tks/s lr=0.0000958 time=173.23 INFO:root:[step 42499] mlm_loss=2.36882 mlm_acc=54.66628 nsp_loss=0.10344 nsp_acc=95.913 throughput=130.0K tks/s lr=0.0000958 time=132.65 INFO:root:[step 42749] mlm_loss=2.19302 mlm_acc=57.02929 nsp_loss=0.07369 nsp_acc=97.176 throughput=122.0K tks/s lr=0.0000957 time=106.00 INFO:root:[step 42999] mlm_loss=2.37478 mlm_acc=54.17968 nsp_loss=0.10911 nsp_acc=95.606 throughput=149.0K tks/s lr=0.0000957 time=143.94 INFO:root:[step 43249] mlm_loss=2.27800 mlm_acc=55.61298 nsp_loss=0.06856 nsp_acc=97.476 throughput=124.0K tks/s lr=0.0000957 time=125.39 INFO:root:[step 43499] mlm_loss=2.49678 mlm_acc=53.55514 nsp_loss=0.11447 nsp_acc=95.393 throughput=150.0K tks/s lr=0.0000957 time=144.91 INFO:root:[step 43749] mlm_loss=2.37685 mlm_acc=55.41812 nsp_loss=0.07226 nsp_acc=97.229 throughput=139.0K tks/s lr=0.0000956 time=125.96 INFO:root:[step 43999] mlm_loss=2.40231 mlm_acc=55.79064 nsp_loss=0.07198 nsp_acc=97.337 throughput=142.0K tks/s lr=0.0000956 time=134.46 INFO:root:[step 44249] mlm_loss=2.43760 mlm_acc=53.90113 nsp_loss=0.11883 nsp_acc=95.094 throughput=153.0K tks/s lr=0.0000956 time=163.65 INFO:root:[step 44499] mlm_loss=2.35484 mlm_acc=56.46327 nsp_loss=0.07145 nsp_acc=97.333 throughput=146.0K tks/s lr=0.0000956 time=145.07 INFO:root:[step 44749] mlm_loss=2.16708 mlm_acc=57.29534 nsp_loss=0.07371 nsp_acc=97.181 throughput=122.0K tks/s lr=0.0000955 time=110.89 INFO:root:[step 44999] mlm_loss=2.19396 mlm_acc=55.97533 nsp_loss=0.13316 nsp_acc=94.450 throughput=137.0K tks/s lr=0.0000955 time=138.32 INFO:root:[step 44999] Saving checkpoints to /home/ubuntu/ckpt-master/0044999.params, /home/ubuntu/ckpt-master/0044999.states. INFO:root:[step 45249] mlm_loss=2.33110 mlm_acc=55.06370 nsp_loss=0.07572 nsp_acc=97.110 throughput=119.0K tks/s lr=0.0000955 time=143.00 INFO:root:[step 45499] mlm_loss=2.32147 mlm_acc=54.28179 nsp_loss=0.08096 nsp_acc=96.862 throughput=132.0K tks/s lr=0.0000955 time=136.61 INFO:root:[step 45749] mlm_loss=2.15697 mlm_acc=57.66145 nsp_loss=0.07659 nsp_acc=97.112 throughput=123.0K tks/s lr=0.0000954 time=111.17 INFO:root:[step 45999] mlm_loss=2.05346 mlm_acc=58.90992 nsp_loss=0.07256 nsp_acc=97.284 throughput=119.0K tks/s lr=0.0000954 time=107.93 INFO:root:[step 46249] mlm_loss=2.31263 mlm_acc=55.90071 nsp_loss=0.07191 nsp_acc=97.306 throughput=129.0K tks/s lr=0.0000954 time=127.68 INFO:root:[step 46499] mlm_loss=2.12130 mlm_acc=57.70347 nsp_loss=0.07184 nsp_acc=97.350 throughput=122.0K tks/s lr=0.0000954 time=106.97 INFO:root:[step 46749] mlm_loss=2.14461 mlm_acc=57.83435 nsp_loss=0.07065 nsp_acc=97.385 throughput=117.0K tks/s lr=0.0000953 time=119.54 INFO:root:[step 46999] mlm_loss=2.22329 mlm_acc=56.91414 nsp_loss=0.06879 nsp_acc=97.428 throughput=130.0K tks/s lr=0.0000953 time=112.55 INFO:root:[step 47249] mlm_loss=2.21479 mlm_acc=57.03823 nsp_loss=0.07015 nsp_acc=97.384 throughput=126.0K tks/s lr=0.0000953 time=110.41 INFO:root:[step 47499] mlm_loss=2.41046 mlm_acc=55.30948 nsp_loss=0.06910 nsp_acc=97.315 throughput=138.0K tks/s lr=0.0000953 time=135.27 INFO:root:[step 47749] mlm_loss=2.08534 mlm_acc=57.73859 nsp_loss=0.07013 nsp_acc=97.373 throughput=117.0K tks/s lr=0.0000952 time=114.94 INFO:root:[step 47999] mlm_loss=2.25500 mlm_acc=56.07457 nsp_loss=0.06598 nsp_acc=97.507 throughput=137.0K tks/s lr=0.0000952 time=122.34 INFO:root:[step 48249] mlm_loss=2.35254 mlm_acc=55.34169 nsp_loss=0.06922 nsp_acc=97.349 throughput=134.0K tks/s lr=0.0000952 time=130.21 INFO:root:[step 48499] mlm_loss=2.26996 mlm_acc=56.69973 nsp_loss=0.07141 nsp_acc=97.371 throughput=127.0K tks/s lr=0.0000952 time=124.62 INFO:root:[step 48749] mlm_loss=2.06156 mlm_acc=58.45581 nsp_loss=0.06709 nsp_acc=97.527 throughput=122.0K tks/s lr=0.0000951 time=108.89 INFO:root:[step 48999] mlm_loss=2.08170 mlm_acc=57.82659 nsp_loss=0.07541 nsp_acc=97.081 throughput=115.0K tks/s lr=0.0000951 time=105.32 INFO:root:[step 49249] mlm_loss=2.25675 mlm_acc=57.27419 nsp_loss=0.07891 nsp_acc=97.037 throughput=143.0K tks/s lr=0.0000951 time=137.46 INFO:root:[step 49499] mlm_loss=2.53797 mlm_acc=51.87249 nsp_loss=0.16059 nsp_acc=93.328 throughput=157.0K tks/s lr=0.0000951 time=170.66 INFO:root:[step 49749] mlm_loss=2.37453 mlm_acc=54.51785 nsp_loss=0.08528 nsp_acc=96.736 throughput=137.0K tks/s lr=0.0000950 time=137.59 INFO:root:[step 49999] mlm_loss=2.11709 mlm_acc=58.23596 nsp_loss=0.06844 nsp_acc=97.497 throughput=122.0K tks/s lr=0.0000950 time=107.96 INFO:root:[step 49999] Saving checkpoints to /home/ubuntu/ckpt-master/0049999.params, /home/ubuntu/ckpt-master/0049999.states. INFO:root:[step 50249] mlm_loss=2.02387 mlm_acc=58.71866 nsp_loss=0.06999 nsp_acc=97.282 throughput=102.0K tks/s lr=0.0000950 time=121.97 INFO:root:[step 50499] mlm_loss=2.19087 mlm_acc=57.49451 nsp_loss=0.06536 nsp_acc=97.581 throughput=122.0K tks/s lr=0.0000950 time=124.19 INFO:root:[step 50749] mlm_loss=2.30924 mlm_acc=56.30378 nsp_loss=0.06817 nsp_acc=97.425 throughput=138.0K tks/s lr=0.0000949 time=118.84 INFO:root:[step 50999] mlm_loss=2.44161 mlm_acc=53.80881 nsp_loss=0.14009 nsp_acc=94.039 throughput=148.0K tks/s lr=0.0000949 time=159.59 INFO:root:[step 51249] mlm_loss=2.39877 mlm_acc=53.89912 nsp_loss=0.15209 nsp_acc=93.569 throughput=149.0K tks/s lr=0.0000949 time=160.57 INFO:root:[step 51499] mlm_loss=2.36084 mlm_acc=55.53426 nsp_loss=0.08218 nsp_acc=96.761 throughput=134.0K tks/s lr=0.0000949 time=130.89 INFO:root:[step 51749] mlm_loss=2.55401 mlm_acc=51.65392 nsp_loss=0.15594 nsp_acc=93.594 throughput=154.0K tks/s lr=0.0000948 time=155.47 INFO:root:[step 51999] mlm_loss=2.26665 mlm_acc=55.21978 nsp_loss=0.09575 nsp_acc=96.178 throughput=131.0K tks/s lr=0.0000948 time=132.44 INFO:root:[step 52249] mlm_loss=2.11726 mlm_acc=57.11079 nsp_loss=0.11256 nsp_acc=95.417 throughput=134.0K tks/s lr=0.0000948 time=123.33 INFO:root:[step 52499] mlm_loss=2.34664 mlm_acc=53.99552 nsp_loss=0.08703 nsp_acc=96.641 throughput=139.0K tks/s lr=0.0000948 time=138.30 INFO:root:[step 52749] mlm_loss=2.41845 mlm_acc=53.43794 nsp_loss=0.13000 nsp_acc=94.571 throughput=154.0K tks/s lr=0.0000947 time=152.64 INFO:root:[step 52999] mlm_loss=2.10423 mlm_acc=57.63152 nsp_loss=0.07086 nsp_acc=97.329 throughput=112.0K tks/s lr=0.0000947 time=118.45 INFO:root:[step 53249] mlm_loss=2.37634 mlm_acc=55.98138 nsp_loss=0.06815 nsp_acc=97.373 throughput=139.0K tks/s lr=0.0000947 time=133.97 INFO:root:[step 53499] mlm_loss=2.34760 mlm_acc=55.86914 nsp_loss=0.06540 nsp_acc=97.545 throughput=135.0K tks/s lr=0.0000947 time=133.21 INFO:root:[step 53749] mlm_loss=2.02116 mlm_acc=58.94896 nsp_loss=0.06971 nsp_acc=97.420 throughput=121.0K tks/s lr=0.0000946 time=106.10 INFO:root:[step 53999] mlm_loss=2.21391 mlm_acc=56.46847 nsp_loss=0.07208 nsp_acc=97.298 throughput=132.0K tks/s lr=0.0000946 time=126.97 INFO:root:[step 54249] mlm_loss=2.17919 mlm_acc=55.41699 nsp_loss=0.12255 nsp_acc=95.064 throughput=141.0K tks/s lr=0.0000946 time=135.31 INFO:root:[step 54499] mlm_loss=2.53334 mlm_acc=52.79778 nsp_loss=0.12492 nsp_acc=94.786 throughput=144.0K tks/s lr=0.0000946 time=141.03 INFO:root:[step 54749] mlm_loss=2.32256 mlm_acc=55.97341 nsp_loss=0.07296 nsp_acc=97.210 throughput=132.0K tks/s lr=0.0000945 time=130.52 INFO:root:[step 54999] mlm_loss=2.42256 mlm_acc=53.94886 nsp_loss=0.11013 nsp_acc=95.531 throughput=145.0K tks/s lr=0.0000945 time=139.30 INFO:root:[step 54999] Saving checkpoints to /home/ubuntu/ckpt-master/0054999.params, /home/ubuntu/ckpt-master/0054999.states. INFO:root:[step 55249] mlm_loss=2.23782 mlm_acc=56.80639 nsp_loss=0.07064 nsp_acc=97.355 throughput=113.0K tks/s lr=0.0000945 time=140.55 INFO:root:[step 55499] mlm_loss=2.17010 mlm_acc=57.56896 nsp_loss=0.06655 nsp_acc=97.476 throughput=127.0K tks/s lr=0.0000945 time=115.22 INFO:root:[step 55749] mlm_loss=2.30944 mlm_acc=55.27444 nsp_loss=0.08102 nsp_acc=96.867 throughput=144.0K tks/s lr=0.0000944 time=143.60 INFO:root:[step 55999] mlm_loss=2.44579 mlm_acc=53.82370 nsp_loss=0.13437 nsp_acc=94.496 throughput=154.0K tks/s lr=0.0000944 time=168.72 INFO:root:[step 56249] mlm_loss=2.31249 mlm_acc=55.28348 nsp_loss=0.10066 nsp_acc=96.000 throughput=145.0K tks/s lr=0.0000944 time=144.93 INFO:root:[step 56499] mlm_loss=2.05744 mlm_acc=58.73755 nsp_loss=0.06972 nsp_acc=97.364 throughput=126.0K tks/s lr=0.0000944 time=112.40 INFO:root:[step 56749] mlm_loss=2.25650 mlm_acc=56.14917 nsp_loss=0.11296 nsp_acc=95.311 throughput=138.0K tks/s lr=0.0000943 time=132.59 INFO:root:[step 56999] mlm_loss=2.24238 mlm_acc=56.45272 nsp_loss=0.10379 nsp_acc=95.638 throughput=132.0K tks/s lr=0.0000943 time=132.17 INFO:root:[step 57249] mlm_loss=2.14801 mlm_acc=56.64109 nsp_loss=0.09516 nsp_acc=96.228 throughput=143.0K tks/s lr=0.0000943 time=123.36 INFO:root:[step 57499] mlm_loss=2.21548 mlm_acc=56.26469 nsp_loss=0.07388 nsp_acc=97.225 throughput=134.0K tks/s lr=0.0000943 time=130.87 INFO:root:[step 57749] mlm_loss=2.31803 mlm_acc=55.06442 nsp_loss=0.10554 nsp_acc=95.687 throughput=152.0K tks/s lr=0.0000942 time=158.18 INFO:root:[step 57999] mlm_loss=2.43320 mlm_acc=54.29584 nsp_loss=0.10275 nsp_acc=95.887 throughput=149.0K tks/s lr=0.0000942 time=148.83 INFO:root:[step 58249] mlm_loss=2.37366 mlm_acc=54.61145 nsp_loss=0.10370 nsp_acc=95.653 throughput=159.0K tks/s lr=0.0000942 time=161.38 INFO:root:[step 58499] mlm_loss=2.05234 mlm_acc=58.47238 nsp_loss=0.06818 nsp_acc=97.434 throughput=115.0K tks/s lr=0.0000942 time=119.68 INFO:root:[step 58749] mlm_loss=2.06242 mlm_acc=58.73148 nsp_loss=0.06697 nsp_acc=97.518 throughput=121.0K tks/s lr=0.0000941 time=108.46 INFO:root:[step 58999] mlm_loss=2.01313 mlm_acc=58.51874 nsp_loss=0.07114 nsp_acc=97.386 throughput=123.0K tks/s lr=0.0000941 time=108.60 INFO:root:[step 59249] mlm_loss=2.31190 mlm_acc=55.69331 nsp_loss=0.10868 nsp_acc=95.613 throughput=145.0K tks/s lr=0.0000941 time=139.90 INFO:root:[step 59499] mlm_loss=2.22583 mlm_acc=56.95060 nsp_loss=0.07880 nsp_acc=96.844 throughput=127.0K tks/s lr=0.0000941 time=125.25 INFO:root:[step 59749] mlm_loss=2.21197 mlm_acc=57.03287 nsp_loss=0.06227 nsp_acc=97.655 throughput=132.0K tks/s lr=0.0000940 time=126.36 INFO:root:[step 59999] mlm_loss=2.20031 mlm_acc=55.80872 nsp_loss=0.09835 nsp_acc=95.996 throughput=144.0K tks/s lr=0.0000940 time=125.05 INFO:root:[step 59999] Saving checkpoints to /home/ubuntu/ckpt-master/0059999.params, /home/ubuntu/ckpt-master/0059999.states. INFO:root:[step 60249] mlm_loss=2.13500 mlm_acc=57.06329 nsp_loss=0.09273 nsp_acc=96.316 throughput=113.0K tks/s lr=0.0000940 time=140.40 INFO:root:[step 60499] mlm_loss=2.38929 mlm_acc=54.04841 nsp_loss=0.18417 nsp_acc=91.953 throughput=142.0K tks/s lr=0.0000940 time=141.04 INFO:root:[step 60749] mlm_loss=2.16909 mlm_acc=57.74228 nsp_loss=0.06538 nsp_acc=97.553 throughput=133.0K tks/s lr=0.0000939 time=117.79 INFO:root:[step 60999] mlm_loss=1.77678 mlm_acc=63.59114 nsp_loss=0.14697 nsp_acc=94.158 throughput=151.0K tks/s lr=0.0000939 time=152.49 INFO:root:[step 61249] mlm_loss=2.20815 mlm_acc=55.88510 nsp_loss=0.10349 nsp_acc=95.905 throughput=135.0K tks/s lr=0.0000939 time=136.30 INFO:root:[step 61499] mlm_loss=2.25402 mlm_acc=56.29033 nsp_loss=0.08996 nsp_acc=96.482 throughput=149.0K tks/s lr=0.0000939 time=143.25 INFO:root:[step 61749] mlm_loss=2.04183 mlm_acc=58.70800 nsp_loss=0.07132 nsp_acc=97.354 throughput=107.0K tks/s lr=0.0000938 time=118.94 INFO:root:[step 61999] mlm_loss=1.83222 mlm_acc=60.36189 nsp_loss=0.07134 nsp_acc=97.397 throughput=108.0K tks/s lr=0.0000938 time=101.38 INFO:root:[step 62249] mlm_loss=2.36599 mlm_acc=54.81880 nsp_loss=0.10922 nsp_acc=95.582 throughput=138.0K tks/s lr=0.0000938 time=132.11 INFO:root:[step 62499] mlm_loss=2.37485 mlm_acc=56.18331 nsp_loss=0.06317 nsp_acc=97.508 throughput=147.0K tks/s lr=0.0000938 time=144.39 INFO:root:[step 62999] mlm_loss=4.23979 mlm_acc=58.13270 nsp_loss=0.13004 nsp_acc=97.522 throughput=124.0K tks/s lr=0.0000937 time=235.57 INFO:root:[step 63249] mlm_loss=2.18761 mlm_acc=57.70765 nsp_loss=0.06506 nsp_acc=97.523 throughput=134.0K tks/s lr=0.0000937 time=117.34 INFO:root:[step 63499] mlm_loss=2.26546 mlm_acc=57.33924 nsp_loss=0.06482 nsp_acc=97.524 throughput=138.0K tks/s lr=0.0000937 time=132.33 INFO:root:[step 63749] mlm_loss=2.35897 mlm_acc=56.20919 nsp_loss=0.06163 nsp_acc=97.608 throughput=148.0K tks/s lr=0.0000936 time=143.52 INFO:root:[step 63999] mlm_loss=2.20696 mlm_acc=55.60789 nsp_loss=0.08446 nsp_acc=96.784 throughput=139.0K tks/s lr=0.0000936 time=136.75 INFO:root:[step 64249] mlm_loss=2.01271 mlm_acc=59.59298 nsp_loss=0.06901 nsp_acc=97.464 throughput=110.0K tks/s lr=0.0000936 time=116.39 INFO:root:[step 64499] mlm_loss=1.96870 mlm_acc=59.40524 nsp_loss=0.07376 nsp_acc=97.291 throughput=130.0K tks/s lr=0.0000936 time=112.97 INFO:root:[step 64749] mlm_loss=2.32431 mlm_acc=56.65699 nsp_loss=0.06109 nsp_acc=97.674 throughput=144.0K tks/s lr=0.0000935 time=137.55 INFO:root:[step 64999] mlm_loss=2.32469 mlm_acc=56.59352 nsp_loss=0.05972 nsp_acc=97.699 throughput=149.0K tks/s lr=0.0000935 time=142.56 INFO:root:[step 64999] Saving checkpoints to /home/ubuntu/ckpt-master/0064999.params, /home/ubuntu/ckpt-master/0064999.states. INFO:root:[step 65249] mlm_loss=2.30994 mlm_acc=55.97623 nsp_loss=0.10803 nsp_acc=95.583 throughput=133.0K tks/s lr=0.0000935 time=174.96 INFO:root:[step 65499] mlm_loss=2.10732 mlm_acc=58.80818 nsp_loss=0.06640 nsp_acc=97.501 throughput=126.0K tks/s lr=0.0000935 time=110.62 INFO:root:[step 65749] mlm_loss=2.04500 mlm_acc=58.80227 nsp_loss=0.06746 nsp_acc=97.469 throughput=125.0K tks/s lr=0.0000934 time=113.21 INFO:root:[step 65999] mlm_loss=2.37083 mlm_acc=53.91328 nsp_loss=0.12372 nsp_acc=94.840 throughput=152.0K tks/s lr=0.0000934 time=164.54 INFO:root:[step 66249] mlm_loss=2.03179 mlm_acc=58.23732 nsp_loss=0.11200 nsp_acc=95.540 throughput=137.0K tks/s lr=0.0000934 time=124.65 INFO:root:[step 66499] mlm_loss=2.00790 mlm_acc=59.52007 nsp_loss=0.06374 nsp_acc=97.638 throughput=110.0K tks/s lr=0.0000934 time=117.25 INFO:root:[step 66749] mlm_loss=2.04288 mlm_acc=59.21949 nsp_loss=0.06584 nsp_acc=97.611 throughput=121.0K tks/s lr=0.0000933 time=108.25 INFO:root:[step 66999] mlm_loss=2.05915 mlm_acc=59.02724 nsp_loss=0.06851 nsp_acc=97.434 throughput=127.0K tks/s lr=0.0000933 time=110.38 INFO:root:[step 67249] mlm_loss=2.14489 mlm_acc=58.22868 nsp_loss=0.06799 nsp_acc=97.426 throughput=122.0K tks/s lr=0.0000933 time=124.10 INFO:root:[step 67749] mlm_loss=3.82249 mlm_acc=63.19637 nsp_loss=0.16257 nsp_acc=96.965 throughput=133.0K tks/s lr=0.0000932 time=255.36 INFO:root:[step 67999] mlm_loss=2.18870 mlm_acc=57.36712 nsp_loss=0.06501 nsp_acc=97.580 throughput=133.0K tks/s lr=0.0000932 time=131.21 INFO:root:[step 68249] mlm_loss=2.12727 mlm_acc=57.37817 nsp_loss=0.10385 nsp_acc=95.707 throughput=146.0K tks/s lr=0.0000932 time=144.48 INFO:root:[step 68499] mlm_loss=1.94202 mlm_acc=59.38226 nsp_loss=0.07519 nsp_acc=97.203 throughput=120.0K tks/s lr=0.0000932 time=110.81 INFO:root:[step 68749] mlm_loss=1.97564 mlm_acc=59.11135 nsp_loss=0.08399 nsp_acc=96.686 throughput=118.0K tks/s lr=0.0000931 time=120.15 INFO:root:[step 68999] mlm_loss=2.00585 mlm_acc=58.39696 nsp_loss=0.10298 nsp_acc=95.807 throughput=138.0K tks/s lr=0.0000931 time=124.40 INFO:root:[step 69249] mlm_loss=2.26390 mlm_acc=57.16432 nsp_loss=0.06172 nsp_acc=97.659 throughput=141.0K tks/s lr=0.0000931 time=136.58 INFO:root:[step 69499] mlm_loss=2.22396 mlm_acc=56.44378 nsp_loss=0.14627 nsp_acc=93.720 throughput=135.0K tks/s lr=0.0000931 time=135.49 INFO:root:[step 69749] mlm_loss=2.20815 mlm_acc=56.40594 nsp_loss=0.11972 nsp_acc=95.042 throughput=145.0K tks/s lr=0.0000930 time=144.02 INFO:root:[step 69999] mlm_loss=2.18422 mlm_acc=57.03600 nsp_loss=0.06939 nsp_acc=97.329 throughput=135.0K tks/s lr=0.0000930 time=130.04 INFO:root:[step 69999] Saving checkpoints to /home/ubuntu/ckpt-master/0069999.params, /home/ubuntu/ckpt-master/0069999.states. INFO:root:[step 70249] mlm_loss=2.26878 mlm_acc=56.28280 nsp_loss=0.07116 nsp_acc=97.234 throughput=128.0K tks/s lr=0.0000930 time=158.05 INFO:root:[step 70499] mlm_loss=2.08744 mlm_acc=57.63545 nsp_loss=0.11798 nsp_acc=95.190 throughput=139.0K tks/s lr=0.0000930 time=136.32 INFO:root:[step 70749] mlm_loss=2.19024 mlm_acc=57.60625 nsp_loss=0.06106 nsp_acc=97.727 throughput=132.0K tks/s lr=0.0000929 time=131.16 INFO:root:[step 70999] mlm_loss=2.07357 mlm_acc=58.68063 nsp_loss=0.06346 nsp_acc=97.644 throughput=132.0K tks/s lr=0.0000929 time=115.42 INFO:root:[step 71249] mlm_loss=2.29050 mlm_acc=55.50671 nsp_loss=0.07963 nsp_acc=96.937 throughput=145.0K tks/s lr=0.0000929 time=149.04 INFO:root:[step 71499] mlm_loss=2.09705 mlm_acc=58.93096 nsp_loss=0.06250 nsp_acc=97.628 throughput=125.0K tks/s lr=0.0000929 time=124.16 INFO:root:[step 71749] mlm_loss=2.17598 mlm_acc=58.34876 nsp_loss=0.06221 nsp_acc=97.601 throughput=134.0K tks/s lr=0.0000928 time=131.24 INFO:root:[step 71999] mlm_loss=2.17766 mlm_acc=58.70917 nsp_loss=0.06075 nsp_acc=97.726 throughput=143.0K tks/s lr=0.0000928 time=126.29 INFO:root:[step 72249] mlm_loss=2.19087 mlm_acc=58.24812 nsp_loss=0.06106 nsp_acc=97.701 throughput=132.0K tks/s lr=0.0000928 time=128.70 INFO:root:[step 72499] mlm_loss=1.96559 mlm_acc=59.86841 nsp_loss=0.06531 nsp_acc=97.603 throughput=122.0K tks/s lr=0.0000928 time=108.64 INFO:root:[step 72749] mlm_loss=2.11489 mlm_acc=56.60808 nsp_loss=0.09674 nsp_acc=96.155 throughput=139.0K tks/s lr=0.0000927 time=137.93 INFO:root:[step 72999] mlm_loss=2.15170 mlm_acc=58.06939 nsp_loss=0.06252 nsp_acc=97.723 throughput=129.0K tks/s lr=0.0000927 time=129.82 INFO:root:[step 73249] mlm_loss=2.17452 mlm_acc=58.20810 nsp_loss=0.06319 nsp_acc=97.535 throughput=136.0K tks/s lr=0.0000927 time=130.42 INFO:root:[step 73499] mlm_loss=2.17449 mlm_acc=58.33963 nsp_loss=0.06224 nsp_acc=97.605 throughput=138.0K tks/s lr=0.0000927 time=121.53 INFO:root:[step 73749] mlm_loss=2.18745 mlm_acc=58.11802 nsp_loss=0.06063 nsp_acc=97.710 throughput=137.0K tks/s lr=0.0000926 time=131.83 INFO:root:[step 73999] mlm_loss=2.22266 mlm_acc=56.91977 nsp_loss=0.10667 nsp_acc=95.514 throughput=140.0K tks/s lr=0.0000926 time=134.90 INFO:root:[step 74249] mlm_loss=1.97429 mlm_acc=58.12201 nsp_loss=0.09490 nsp_acc=96.273 throughput=126.0K tks/s lr=0.0000926 time=116.71 INFO:root:[step 74499] mlm_loss=2.10802 mlm_acc=58.74609 nsp_loss=0.06463 nsp_acc=97.623 throughput=122.0K tks/s lr=0.0000926 time=131.32 INFO:root:[step 74749] mlm_loss=1.97530 mlm_acc=59.81099 nsp_loss=0.06368 nsp_acc=97.643 throughput=122.0K tks/s lr=0.0000925 time=109.04 INFO:root:[step 74999] mlm_loss=2.13947 mlm_acc=58.47271 nsp_loss=0.06486 nsp_acc=97.518 throughput=129.0K tks/s lr=0.0000925 time=127.69 INFO:root:[step 74999] Saving checkpoints to /home/ubuntu/ckpt-master/0074999.params, /home/ubuntu/ckpt-master/0074999.states. INFO:root:[step 75249] mlm_loss=2.03613 mlm_acc=59.26205 nsp_loss=0.06135 nsp_acc=97.592 throughput=107.0K tks/s lr=0.0000925 time=137.98 INFO:root:[step 75499] mlm_loss=2.05861 mlm_acc=58.77233 nsp_loss=0.06449 nsp_acc=97.609 throughput=135.0K tks/s lr=0.0000925 time=115.86 INFO:root:[step 75749] mlm_loss=1.88789 mlm_acc=60.34113 nsp_loss=0.06398 nsp_acc=97.568 throughput=117.0K tks/s lr=0.0000924 time=121.79 INFO:root:[step 75999] mlm_loss=1.98037 mlm_acc=60.26163 nsp_loss=0.06569 nsp_acc=97.535 throughput=122.0K tks/s lr=0.0000924 time=110.22 INFO:root:[step 76249] mlm_loss=1.85976 mlm_acc=60.90891 nsp_loss=0.06313 nsp_acc=97.771 throughput=119.0K tks/s lr=0.0000924 time=108.36 INFO:root:[step 76499] mlm_loss=2.15671 mlm_acc=57.78906 nsp_loss=0.06000 nsp_acc=97.730 throughput=138.0K tks/s lr=0.0000924 time=133.46 INFO:root:[step 76749] mlm_loss=2.20051 mlm_acc=56.14115 nsp_loss=0.17397 nsp_acc=92.395 throughput=155.0K tks/s lr=0.0000923 time=153.10 INFO:root:[step 76999] mlm_loss=1.94837 mlm_acc=59.81682 nsp_loss=0.06682 nsp_acc=97.521 throughput=115.0K tks/s lr=0.0000923 time=121.21 INFO:root:[step 77249] mlm_loss=2.02564 mlm_acc=59.67278 nsp_loss=0.05580 nsp_acc=97.936 throughput=136.0K tks/s lr=0.0000923 time=115.78 INFO:root:[step 77499] mlm_loss=2.00501 mlm_acc=59.66953 nsp_loss=0.06048 nsp_acc=97.789 throughput=118.0K tks/s lr=0.0000923 time=120.15 INFO:root:[step 77749] mlm_loss=2.08098 mlm_acc=57.10832 nsp_loss=0.10635 nsp_acc=95.755 throughput=139.0K tks/s lr=0.0000922 time=136.84 INFO:root:[step 77999] mlm_loss=2.00139 mlm_acc=57.78461 nsp_loss=0.08798 nsp_acc=96.592 throughput=141.0K tks/s lr=0.0000922 time=120.10 INFO:root:[step 78249] mlm_loss=2.08338 mlm_acc=57.58001 nsp_loss=0.13702 nsp_acc=94.299 throughput=137.0K tks/s lr=0.0000922 time=138.11 INFO:root:[step 78499] mlm_loss=2.07862 mlm_acc=58.92552 nsp_loss=0.05707 nsp_acc=97.890 throughput=132.0K tks/s lr=0.0000922 time=123.62 INFO:root:[step 78749] mlm_loss=2.26416 mlm_acc=55.92157 nsp_loss=0.08495 nsp_acc=96.536 throughput=154.0K tks/s lr=0.0000921 time=153.12 INFO:root:[step 78999] mlm_loss=1.98100 mlm_acc=58.68122 nsp_loss=0.07344 nsp_acc=97.267 throughput=129.0K tks/s lr=0.0000921 time=120.39 INFO:root:[step 79249] mlm_loss=2.42778 mlm_acc=53.73853 nsp_loss=0.14987 nsp_acc=93.733 throughput=143.0K tks/s lr=0.0000921 time=143.65 INFO:root:[step 79499] mlm_loss=1.82147 mlm_acc=60.05751 nsp_loss=0.07171 nsp_acc=97.277 throughput=109.0K tks/s lr=0.0000921 time=114.60 INFO:root:[step 79749] mlm_loss=2.37170 mlm_acc=55.04568 nsp_loss=0.11277 nsp_acc=95.308 throughput=138.0K tks/s lr=0.0000920 time=137.87 INFO:root:[step 79999] mlm_loss=1.88446 mlm_acc=60.77934 nsp_loss=0.06134 nsp_acc=97.792 throughput=118.0K tks/s lr=0.0000920 time=106.20 INFO:root:[step 79999] Saving checkpoints to /home/ubuntu/ckpt-master/0079999.params, /home/ubuntu/ckpt-master/0079999.states. INFO:root:[step 80249] mlm_loss=2.13534 mlm_acc=56.43832 nsp_loss=0.08869 nsp_acc=96.441 throughput=128.0K tks/s lr=0.0000920 time=136.56 INFO:root:[step 80499] mlm_loss=1.92887 mlm_acc=60.39063 nsp_loss=0.06050 nsp_acc=97.824 throughput=113.0K tks/s lr=0.0000920 time=118.26 INFO:root:[step 80749] mlm_loss=1.90328 mlm_acc=60.36026 nsp_loss=0.06139 nsp_acc=97.728 throughput=122.0K tks/s lr=0.0000919 time=108.89 INFO:root:[step 80999] mlm_loss=1.86145 mlm_acc=61.02757 nsp_loss=0.05799 nsp_acc=97.855 throughput=119.0K tks/s lr=0.0000919 time=105.55 INFO:root:[step 81249] mlm_loss=1.77613 mlm_acc=65.03643 nsp_loss=0.08572 nsp_acc=96.816 throughput=146.0K tks/s lr=0.0000919 time=144.95 INFO:root:[step 81499] mlm_loss=2.11580 mlm_acc=59.40119 nsp_loss=0.05939 nsp_acc=97.794 throughput=134.0K tks/s lr=0.0000919 time=131.02 INFO:root:[step 81749] mlm_loss=2.14200 mlm_acc=58.57620 nsp_loss=0.05745 nsp_acc=97.849 throughput=133.0K tks/s lr=0.0000918 time=133.08 INFO:root:[step 81999] mlm_loss=2.19557 mlm_acc=57.55686 nsp_loss=0.08288 nsp_acc=96.695 throughput=144.0K tks/s lr=0.0000918 time=136.81 INFO:root:[step 82249] mlm_loss=2.20663 mlm_acc=56.77961 nsp_loss=0.08703 nsp_acc=96.479 throughput=145.0K tks/s lr=0.0000918 time=141.78 INFO:root:[step 82499] mlm_loss=2.16480 mlm_acc=56.65263 nsp_loss=0.09692 nsp_acc=96.076 throughput=139.0K tks/s lr=0.0000918 time=134.03 INFO:root:[step 82749] mlm_loss=1.96356 mlm_acc=60.50373 nsp_loss=0.05764 nsp_acc=97.885 throughput=128.0K tks/s lr=0.0000917 time=113.24 INFO:root:[step 82999] mlm_loss=1.97639 mlm_acc=59.94303 nsp_loss=0.05702 nsp_acc=97.911 throughput=121.0K tks/s lr=0.0000917 time=120.63 INFO:root:[step 83249] mlm_loss=2.08267 mlm_acc=59.36356 nsp_loss=0.05741 nsp_acc=97.825 throughput=139.0K tks/s lr=0.0000917 time=118.04 INFO:root:[step 83499] mlm_loss=2.17732 mlm_acc=57.14884 nsp_loss=0.12897 nsp_acc=94.526 throughput=148.0K tks/s lr=0.0000917 time=158.46 INFO:root:[step 83749] mlm_loss=2.20103 mlm_acc=58.23463 nsp_loss=0.05383 nsp_acc=97.941 throughput=142.0K tks/s lr=0.0000916 time=139.26 INFO:root:[step 83999] mlm_loss=2.08830 mlm_acc=58.98002 nsp_loss=0.06219 nsp_acc=97.716 throughput=136.0K tks/s lr=0.0000916 time=122.73 INFO:root:[step 84249] mlm_loss=2.12911 mlm_acc=58.95000 nsp_loss=0.05809 nsp_acc=97.813 throughput=134.0K tks/s lr=0.0000916 time=131.12 INFO:root:[step 84499] mlm_loss=1.78096 mlm_acc=62.13904 nsp_loss=0.06500 nsp_acc=97.690 throughput=121.0K tks/s lr=0.0000916 time=120.70 INFO:root:[step 84749] mlm_loss=2.10265 mlm_acc=59.18816 nsp_loss=0.05610 nsp_acc=97.886 throughput=142.0K tks/s lr=0.0000915 time=122.39 INFO:root:[step 84999] mlm_loss=1.91988 mlm_acc=60.67648 nsp_loss=0.05765 nsp_acc=97.908 throughput=117.0K tks/s lr=0.0000915 time=118.91 INFO:root:[step 84999] Saving checkpoints to /home/ubuntu/ckpt-master/0084999.params, /home/ubuntu/ckpt-master/0084999.states. INFO:root:[step 85249] mlm_loss=1.94881 mlm_acc=60.41345 nsp_loss=0.06204 nsp_acc=97.700 throughput=109.0K tks/s lr=0.0000915 time=123.43 INFO:root:[step 85499] mlm_loss=1.98102 mlm_acc=59.92634 nsp_loss=0.06522 nsp_acc=97.612 throughput=122.0K tks/s lr=0.0000915 time=117.44 INFO:root:[step 85749] mlm_loss=2.22507 mlm_acc=55.57907 nsp_loss=0.10315 nsp_acc=95.927 throughput=157.0K tks/s lr=0.0000914 time=160.18 INFO:root:[step 85999] mlm_loss=1.85499 mlm_acc=61.17533 nsp_loss=0.06684 nsp_acc=97.563 throughput=122.0K tks/s lr=0.0000914 time=108.86 INFO:root:[step 86249] mlm_loss=2.09863 mlm_acc=57.10211 nsp_loss=0.13307 nsp_acc=94.442 throughput=151.0K tks/s lr=0.0000914 time=163.17 INFO:root:[step 86499] mlm_loss=2.27533 mlm_acc=56.15688 nsp_loss=0.07784 nsp_acc=96.807 throughput=149.0K tks/s lr=0.0000914 time=145.16 INFO:root:[step 86749] mlm_loss=2.19249 mlm_acc=58.40848 nsp_loss=0.05501 nsp_acc=97.885 throughput=142.0K tks/s lr=0.0000913 time=139.28 INFO:root:[step 86999] mlm_loss=2.04906 mlm_acc=59.65959 nsp_loss=0.06065 nsp_acc=97.698 throughput=133.0K tks/s lr=0.0000913 time=116.66 INFO:root:[step 87249] mlm_loss=1.96137 mlm_acc=59.95738 nsp_loss=0.06165 nsp_acc=97.685 throughput=119.0K tks/s lr=0.0000913 time=121.09 INFO:root:[step 87499] mlm_loss=2.16872 mlm_acc=58.15639 nsp_loss=0.07514 nsp_acc=96.949 throughput=148.0K tks/s lr=0.0000913 time=142.52 INFO:root:[step 87749] mlm_loss=2.15987 mlm_acc=57.60942 nsp_loss=0.10150 nsp_acc=95.913 throughput=153.0K tks/s lr=0.0000912 time=172.59 INFO:root:[step 87999] mlm_loss=2.05296 mlm_acc=58.15179 nsp_loss=0.14484 nsp_acc=93.768 throughput=138.0K tks/s lr=0.0000912 time=123.01 INFO:root:[step 88249] mlm_loss=2.09608 mlm_acc=59.20946 nsp_loss=0.05574 nsp_acc=97.875 throughput=136.0K tks/s lr=0.0000912 time=130.64 INFO:root:[step 88499] mlm_loss=2.11366 mlm_acc=59.25120 nsp_loss=0.05912 nsp_acc=97.732 throughput=133.0K tks/s lr=0.0000912 time=127.18 INFO:root:[step 88749] mlm_loss=2.21942 mlm_acc=56.46895 nsp_loss=0.07934 nsp_acc=96.817 throughput=152.0K tks/s lr=0.0000911 time=153.13 INFO:root:[step 88999] mlm_loss=1.90758 mlm_acc=59.48753 nsp_loss=0.06486 nsp_acc=97.579 throughput=125.0K tks/s lr=0.0000911 time=124.62 INFO:root:[step 89249] mlm_loss=2.11179 mlm_acc=57.75033 nsp_loss=0.16785 nsp_acc=92.770 throughput=157.0K tks/s lr=0.0000911 time=165.57 INFO:root:[step 89499] mlm_loss=1.99657 mlm_acc=59.19701 nsp_loss=0.11103 nsp_acc=95.404 throughput=128.0K tks/s lr=0.0000911 time=116.26 INFO:root:[step 89749] mlm_loss=2.13766 mlm_acc=58.82122 nsp_loss=0.06187 nsp_acc=97.657 throughput=134.0K tks/s lr=0.0000910 time=128.79 INFO:root:[step 89999] mlm_loss=1.94089 mlm_acc=60.00098 nsp_loss=0.06943 nsp_acc=97.363 throughput=119.0K tks/s lr=0.0000910 time=118.80 INFO:root:[step 89999] Saving checkpoints to /home/ubuntu/ckpt-master/0089999.params, /home/ubuntu/ckpt-master/0089999.states. INFO:root:[step 90249] mlm_loss=2.20502 mlm_acc=56.91858 nsp_loss=0.11336 nsp_acc=95.190 throughput=134.0K tks/s lr=0.0000910 time=161.66 INFO:root:[step 90499] mlm_loss=2.12492 mlm_acc=57.56162 nsp_loss=0.12456 nsp_acc=94.751 throughput=145.0K tks/s lr=0.0000910 time=145.71 INFO:root:[step 90749] mlm_loss=1.98249 mlm_acc=59.95932 nsp_loss=0.05406 nsp_acc=97.987 throughput=134.0K tks/s lr=0.0000909 time=115.01 INFO:root:[step 90999] mlm_loss=2.19447 mlm_acc=56.46269 nsp_loss=0.10451 nsp_acc=95.703 throughput=153.0K tks/s lr=0.0000909 time=164.79 INFO:root:[step 91249] mlm_loss=2.12822 mlm_acc=58.38495 nsp_loss=0.05367 nsp_acc=98.042 throughput=139.0K tks/s lr=0.0000909 time=137.44 INFO:root:[step 91499] mlm_loss=1.88996 mlm_acc=60.87651 nsp_loss=0.05778 nsp_acc=97.902 throughput=123.0K tks/s lr=0.0000909 time=111.07 INFO:root:[step 91749] mlm_loss=2.06615 mlm_acc=58.60018 nsp_loss=0.07447 nsp_acc=97.027 throughput=144.0K tks/s lr=0.0000908 time=136.49 INFO:root:[step 91999] mlm_loss=2.09621 mlm_acc=58.38840 nsp_loss=0.08148 nsp_acc=96.792 throughput=135.0K tks/s lr=0.0000908 time=139.31 INFO:root:[step 92249] mlm_loss=1.97779 mlm_acc=59.32183 nsp_loss=0.06331 nsp_acc=97.581 throughput=131.0K tks/s lr=0.0000908 time=114.11 INFO:root:[step 92499] mlm_loss=2.14767 mlm_acc=57.89949 nsp_loss=0.11128 nsp_acc=95.408 throughput=145.0K tks/s lr=0.0000908 time=157.71 INFO:root:[step 92749] mlm_loss=2.07548 mlm_acc=58.94693 nsp_loss=0.11509 nsp_acc=95.400 throughput=160.0K tks/s lr=0.0000907 time=161.13 INFO:root:[step 92999] mlm_loss=2.09833 mlm_acc=58.58909 nsp_loss=0.06925 nsp_acc=97.278 throughput=143.0K tks/s lr=0.0000907 time=139.11 INFO:root:[step 93249] mlm_loss=2.07932 mlm_acc=58.43770 nsp_loss=0.10286 nsp_acc=95.842 throughput=150.0K tks/s lr=0.0000907 time=148.87 INFO:root:[step 93499] mlm_loss=1.87605 mlm_acc=61.04643 nsp_loss=0.05704 nsp_acc=97.917 throughput=112.0K tks/s lr=0.0000907 time=119.18 INFO:root:[step 93749] mlm_loss=1.87177 mlm_acc=59.87356 nsp_loss=0.07135 nsp_acc=97.217 throughput=130.0K tks/s lr=0.0000906 time=113.76 INFO:root:[step 93999] mlm_loss=2.13531 mlm_acc=58.49715 nsp_loss=0.07825 nsp_acc=97.012 throughput=146.0K tks/s lr=0.0000906 time=142.01 INFO:root:[step 94249] mlm_loss=1.94873 mlm_acc=58.96890 nsp_loss=0.07300 nsp_acc=97.241 throughput=132.0K tks/s lr=0.0000906 time=128.35 INFO:root:[step 94499] mlm_loss=1.95506 mlm_acc=59.27038 nsp_loss=0.07647 nsp_acc=97.078 throughput=133.0K tks/s lr=0.0000906 time=132.97 INFO:root:[step 94749] mlm_loss=1.85179 mlm_acc=61.99246 nsp_loss=0.10304 nsp_acc=95.960 throughput=147.0K tks/s lr=0.0000905 time=154.12 INFO:root:[step 94999] mlm_loss=1.92118 mlm_acc=59.55642 nsp_loss=0.12205 nsp_acc=94.803 throughput=136.0K tks/s lr=0.0000905 time=118.38 INFO:root:[step 94999] Saving checkpoints to /home/ubuntu/ckpt-master/0094999.params, /home/ubuntu/ckpt-master/0094999.states. INFO:root:[step 95249] mlm_loss=1.87879 mlm_acc=60.92535 nsp_loss=0.07151 nsp_acc=97.187 throughput=101.0K tks/s lr=0.0000905 time=134.85 INFO:root:[step 95499] mlm_loss=1.87685 mlm_acc=61.25950 nsp_loss=0.05871 nsp_acc=97.789 throughput=121.0K tks/s lr=0.0000905 time=108.35 INFO:root:[step 95749] mlm_loss=1.99439 mlm_acc=58.54810 nsp_loss=0.10207 nsp_acc=95.832 throughput=134.0K tks/s lr=0.0000904 time=134.26 INFO:root:[step 95999] mlm_loss=2.01506 mlm_acc=58.77323 nsp_loss=0.05961 nsp_acc=97.757 throughput=142.0K tks/s lr=0.0000904 time=121.15 INFO:root:[step 96249] mlm_loss=2.09385 mlm_acc=57.52141 nsp_loss=0.07502 nsp_acc=97.172 throughput=137.0K tks/s lr=0.0000904 time=136.35 INFO:root:[step 96499] mlm_loss=1.96608 mlm_acc=60.01794 nsp_loss=0.06613 nsp_acc=97.408 throughput=123.0K tks/s lr=0.0000904 time=118.78 INFO:root:[step 96749] mlm_loss=2.21801 mlm_acc=57.24662 nsp_loss=0.10375 nsp_acc=95.722 throughput=138.0K tks/s lr=0.0000903 time=139.81 INFO:root:[step 96999] mlm_loss=2.10536 mlm_acc=59.06320 nsp_loss=0.05214 nsp_acc=98.062 throughput=141.0K tks/s lr=0.0000903 time=124.34 INFO:root:[step 97249] mlm_loss=1.93895 mlm_acc=60.75899 nsp_loss=0.06006 nsp_acc=97.748 throughput=116.0K tks/s lr=0.0000903 time=118.71 INFO:root:[step 97499] mlm_loss=1.91798 mlm_acc=60.79961 nsp_loss=0.05937 nsp_acc=97.839 throughput=129.0K tks/s lr=0.0000903 time=114.76 INFO:root:[step 97749] mlm_loss=1.86970 mlm_acc=60.97904 nsp_loss=0.05629 nsp_acc=97.970 throughput=118.0K tks/s lr=0.0000902 time=117.21 INFO:root:[step 97999] mlm_loss=1.99257 mlm_acc=60.23558 nsp_loss=0.05731 nsp_acc=97.834 throughput=132.0K tks/s lr=0.0000902 time=116.40 INFO:root:[step 98249] mlm_loss=2.01069 mlm_acc=59.48210 nsp_loss=0.06834 nsp_acc=97.387 throughput=127.0K tks/s lr=0.0000902 time=122.13 INFO:root:[step 98499] mlm_loss=1.96666 mlm_acc=58.88966 nsp_loss=0.08110 nsp_acc=96.828 throughput=135.0K tks/s lr=0.0000902 time=123.54 INFO:root:[step 98749] mlm_loss=1.87064 mlm_acc=61.30500 nsp_loss=0.05312 nsp_acc=98.043 throughput=117.0K tks/s lr=0.0000901 time=117.66 INFO:root:[step 98999] mlm_loss=2.13812 mlm_acc=58.77393 nsp_loss=0.05151 nsp_acc=98.042 throughput=145.0K tks/s lr=0.0000901 time=140.92 INFO:root:[step 99249] mlm_loss=2.13085 mlm_acc=58.52870 nsp_loss=0.05508 nsp_acc=97.931 throughput=144.0K tks/s lr=0.0000901 time=140.24 INFO:root:[step 99499] mlm_loss=1.96260 mlm_acc=60.72112 nsp_loss=0.06002 nsp_acc=97.804 throughput=136.0K tks/s lr=0.0000901 time=115.95 INFO:root:[step 99749] mlm_loss=2.07806 mlm_acc=57.76407 nsp_loss=0.12259 nsp_acc=94.954 throughput=136.0K tks/s lr=0.0000900 time=134.42 INFO:root:[step 99999] mlm_loss=2.22213 mlm_acc=56.29755 nsp_loss=0.11479 nsp_acc=95.291 throughput=147.0K tks/s lr=0.0000900 time=159.74 INFO:root:[step 99999] Saving checkpoints to /home/ubuntu/ckpt-master/0099999.params, /home/ubuntu/ckpt-master/0099999.states. INFO:root:[step 100249] mlm_loss=1.92438 mlm_acc=60.60393 nsp_loss=0.06203 nsp_acc=97.736 throughput=117.0K tks/s lr=0.0000900 time=129.95 INFO:root:[step 100499] mlm_loss=2.11673 mlm_acc=57.95752 nsp_loss=0.09611 nsp_acc=96.168 throughput=150.0K tks/s lr=0.0000900 time=148.39 INFO:root:[step 100749] mlm_loss=2.13716 mlm_acc=58.06093 nsp_loss=0.08645 nsp_acc=96.597 throughput=150.0K tks/s lr=0.0000899 time=145.54 INFO:root:[step 100999] mlm_loss=2.05254 mlm_acc=59.70142 nsp_loss=0.05878 nsp_acc=97.798 throughput=130.0K tks/s lr=0.0000899 time=125.21 INFO:root:[step 101249] mlm_loss=1.52327 mlm_acc=69.31724 nsp_loss=0.08929 nsp_acc=96.811 throughput=142.0K tks/s lr=0.0000899 time=142.27 INFO:root:[step 101499] mlm_loss=1.86297 mlm_acc=60.99361 nsp_loss=0.06238 nsp_acc=97.731 throughput=124.0K tks/s lr=0.0000899 time=111.10 INFO:root:[step 101749] mlm_loss=2.02825 mlm_acc=59.72708 nsp_loss=0.05835 nsp_acc=97.837 throughput=131.0K tks/s lr=0.0000898 time=130.58 INFO:root:[step 101999] mlm_loss=2.06403 mlm_acc=56.98297 nsp_loss=0.06701 nsp_acc=97.522 throughput=138.0K tks/s lr=0.0000898 time=139.05 INFO:root:[step 102249] mlm_loss=2.05937 mlm_acc=57.40786 nsp_loss=0.09130 nsp_acc=96.421 throughput=133.0K tks/s lr=0.0000898 time=133.26 INFO:root:[step 102499] mlm_loss=1.99184 mlm_acc=58.80467 nsp_loss=0.09632 nsp_acc=96.226 throughput=139.0K tks/s lr=0.0000898 time=139.01 INFO:root:[step 102749] mlm_loss=1.81531 mlm_acc=61.80842 nsp_loss=0.06044 nsp_acc=97.812 throughput=121.0K tks/s lr=0.0000897 time=105.91 INFO:root:[step 102999] mlm_loss=1.81614 mlm_acc=61.82541 nsp_loss=0.06046 nsp_acc=97.826 throughput=118.0K tks/s lr=0.0000897 time=107.20 INFO:root:[step 103249] mlm_loss=2.15486 mlm_acc=56.71670 nsp_loss=0.09761 nsp_acc=96.144 throughput=160.0K tks/s lr=0.0000897 time=159.86 INFO:root:[step 103499] mlm_loss=1.99307 mlm_acc=58.62088 nsp_loss=0.07614 nsp_acc=97.130 throughput=140.0K tks/s lr=0.0000897 time=138.93 INFO:root:[step 103749] mlm_loss=2.08460 mlm_acc=59.47297 nsp_loss=0.05767 nsp_acc=97.862 throughput=133.0K tks/s lr=0.0000896 time=132.13 INFO:root:[step 103999] mlm_loss=1.85571 mlm_acc=61.64137 nsp_loss=0.05949 nsp_acc=97.812 throughput=119.0K tks/s lr=0.0000896 time=111.47 INFO:root:[step 104249] mlm_loss=1.88707 mlm_acc=60.14758 nsp_loss=0.08478 nsp_acc=96.622 throughput=126.0K tks/s lr=0.0000896 time=124.25 INFO:root:[step 104499] mlm_loss=2.24448 mlm_acc=56.54441 nsp_loss=0.10941 nsp_acc=95.368 throughput=152.0K tks/s lr=0.0000896 time=150.00 INFO:root:[step 104749] mlm_loss=1.92386 mlm_acc=60.73012 nsp_loss=0.05438 nsp_acc=97.985 throughput=123.0K tks/s lr=0.0000895 time=120.70 INFO:root:[step 104999] mlm_loss=2.09476 mlm_acc=59.61611 nsp_loss=0.05650 nsp_acc=97.824 throughput=136.0K tks/s lr=0.0000895 time=132.72 INFO:root:[step 104999] Saving checkpoints to /home/ubuntu/ckpt-master/0104999.params, /home/ubuntu/ckpt-master/0104999.states. INFO:root:[step 105249] mlm_loss=1.96149 mlm_acc=60.75393 nsp_loss=0.06229 nsp_acc=97.647 throughput=115.0K tks/s lr=0.0000895 time=128.01 INFO:root:[step 105499] mlm_loss=1.89947 mlm_acc=61.36654 nsp_loss=0.05759 nsp_acc=97.876 throughput=127.0K tks/s lr=0.0000895 time=110.11 INFO:root:[step 105749] mlm_loss=1.97534 mlm_acc=60.70588 nsp_loss=0.05693 nsp_acc=97.899 throughput=120.0K tks/s lr=0.0000894 time=121.77 INFO:root:[step 105999] mlm_loss=1.84359 mlm_acc=61.91786 nsp_loss=0.06016 nsp_acc=97.809 throughput=121.0K tks/s lr=0.0000894 time=108.39 INFO:root:[step 106249] mlm_loss=1.99444 mlm_acc=57.99202 nsp_loss=0.09307 nsp_acc=96.294 throughput=134.0K tks/s lr=0.0000894 time=133.79 INFO:root:[step 106499] mlm_loss=1.80123 mlm_acc=61.92865 nsp_loss=0.05671 nsp_acc=97.891 throughput=120.0K tks/s lr=0.0000894 time=105.44 INFO:root:[step 106749] mlm_loss=2.10635 mlm_acc=57.61878 nsp_loss=0.06713 nsp_acc=97.392 throughput=151.0K tks/s lr=0.0000893 time=146.71 INFO:root:[step 106999] mlm_loss=1.90344 mlm_acc=60.40467 nsp_loss=0.06168 nsp_acc=97.741 throughput=125.0K tks/s lr=0.0000893 time=121.81 INFO:root:[step 107249] mlm_loss=2.10401 mlm_acc=59.22235 nsp_loss=0.05387 nsp_acc=97.958 throughput=141.0K tks/s lr=0.0000893 time=136.56 INFO:root:[step 107499] mlm_loss=1.73390 mlm_acc=62.09960 nsp_loss=0.06831 nsp_acc=97.508 throughput=123.0K tks/s lr=0.0000893 time=113.67 INFO:root:[step 107749] mlm_loss=1.98519 mlm_acc=59.40908 nsp_loss=0.08329 nsp_acc=96.674 throughput=140.0K tks/s lr=0.0000892 time=137.05 INFO:root:[step 107999] mlm_loss=2.24099 mlm_acc=56.61422 nsp_loss=0.09901 nsp_acc=96.000 throughput=153.0K tks/s lr=0.0000892 time=166.10 INFO:root:[step 108249] mlm_loss=2.14968 mlm_acc=57.78782 nsp_loss=0.08568 nsp_acc=96.658 throughput=145.0K tks/s lr=0.0000892 time=144.32 INFO:root:[step 108499] mlm_loss=1.96764 mlm_acc=60.81267 nsp_loss=0.05686 nsp_acc=97.829 throughput=130.0K tks/s lr=0.0000892 time=128.19 INFO:root:[step 108749] mlm_loss=1.71974 mlm_acc=62.76758 nsp_loss=0.06228 nsp_acc=97.771 throughput=122.0K tks/s lr=0.0000891 time=109.82 INFO:root:[step 108999] mlm_loss=1.74468 mlm_acc=62.51667 nsp_loss=0.06004 nsp_acc=97.840 throughput=117.0K tks/s lr=0.0000891 time=105.68 INFO:root:[step 109249] mlm_loss=1.97072 mlm_acc=60.49018 nsp_loss=0.05789 nsp_acc=97.839 throughput=129.0K tks/s lr=0.0000891 time=124.76 INFO:root:[step 109499] mlm_loss=2.02927 mlm_acc=60.25582 nsp_loss=0.05764 nsp_acc=97.893 throughput=138.0K tks/s lr=0.0000891 time=122.31 INFO:root:[step 109749] mlm_loss=2.22713 mlm_acc=56.02798 nsp_loss=0.10493 nsp_acc=95.737 throughput=145.0K tks/s lr=0.0000890 time=160.85 INFO:root:[step 109999] mlm_loss=1.81453 mlm_acc=62.19795 nsp_loss=0.05546 nsp_acc=98.013 throughput=126.0K tks/s lr=0.0000890 time=112.81 INFO:root:[step 109999] Saving checkpoints to /home/ubuntu/ckpt-master/0109999.params, /home/ubuntu/ckpt-master/0109999.states. INFO:root:[step 110249] mlm_loss=1.81000 mlm_acc=62.28553 nsp_loss=0.05644 nsp_acc=97.982 throughput=104.0K tks/s lr=0.0000890 time=122.39 INFO:root:[step 110499] mlm_loss=1.92928 mlm_acc=60.88755 nsp_loss=0.05867 nsp_acc=97.832 throughput=119.0K tks/s lr=0.0000890 time=120.83 INFO:root:[step 110749] mlm_loss=1.80485 mlm_acc=61.77599 nsp_loss=0.06003 nsp_acc=97.807 throughput=121.0K tks/s lr=0.0000889 time=108.02 INFO:root:[step 110999] mlm_loss=1.79233 mlm_acc=62.09260 nsp_loss=0.05855 nsp_acc=97.859 throughput=123.0K tks/s lr=0.0000889 time=108.35 INFO:root:[step 111249] mlm_loss=1.80512 mlm_acc=62.19130 nsp_loss=0.05750 nsp_acc=97.894 throughput=110.0K tks/s lr=0.0000889 time=117.41 INFO:root:[step 111499] mlm_loss=1.89677 mlm_acc=61.26282 nsp_loss=0.06012 nsp_acc=97.775 throughput=123.0K tks/s lr=0.0000889 time=111.64 INFO:root:[step 111749] mlm_loss=1.75972 mlm_acc=61.88588 nsp_loss=0.06993 nsp_acc=97.355 throughput=117.0K tks/s lr=0.0000888 time=106.17 INFO:root:[step 111999] mlm_loss=1.72719 mlm_acc=62.11595 nsp_loss=0.10196 nsp_acc=96.023 throughput=116.0K tks/s lr=0.0000888 time=118.40 INFO:root:[step 112249] mlm_loss=2.16212 mlm_acc=57.59554 nsp_loss=0.12120 nsp_acc=94.871 throughput=153.0K tks/s lr=0.0000888 time=151.97 INFO:root:[step 112499] mlm_loss=2.13140 mlm_acc=58.20354 nsp_loss=0.12083 nsp_acc=94.915 throughput=155.0K tks/s lr=0.0000888 time=153.94 INFO:root:[step 112749] mlm_loss=1.87456 mlm_acc=61.01611 nsp_loss=0.06351 nsp_acc=97.661 throughput=124.0K tks/s lr=0.0000887 time=127.01 INFO:root:[step 112999] mlm_loss=2.00864 mlm_acc=60.79431 nsp_loss=0.05542 nsp_acc=97.913 throughput=131.0K tks/s lr=0.0000887 time=130.14 INFO:root:[step 113249] mlm_loss=1.98687 mlm_acc=59.29610 nsp_loss=0.07554 nsp_acc=97.065 throughput=143.0K tks/s lr=0.0000887 time=124.18 INFO:root:[step 113499] mlm_loss=1.86929 mlm_acc=60.16994 nsp_loss=0.08195 nsp_acc=96.834 throughput=129.0K tks/s lr=0.0000887 time=129.23 INFO:root:[step 113749] mlm_loss=1.94117 mlm_acc=59.92571 nsp_loss=0.08972 nsp_acc=96.378 throughput=130.0K tks/s lr=0.0000886 time=129.70 INFO:root:[step 113999] mlm_loss=1.92682 mlm_acc=60.72619 nsp_loss=0.05902 nsp_acc=97.824 throughput=129.0K tks/s lr=0.0000886 time=112.65 INFO:root:[step 114249] mlm_loss=2.07743 mlm_acc=59.55689 nsp_loss=0.05278 nsp_acc=97.976 throughput=141.0K tks/s lr=0.0000886 time=132.63 INFO:root:[step 114499] mlm_loss=1.89778 mlm_acc=60.73442 nsp_loss=0.05548 nsp_acc=97.877 throughput=133.0K tks/s lr=0.0000886 time=118.78 INFO:root:[step 114749] mlm_loss=2.01958 mlm_acc=60.16139 nsp_loss=0.05300 nsp_acc=98.070 throughput=133.0K tks/s lr=0.0000885 time=130.89 INFO:root:[step 114999] mlm_loss=2.02930 mlm_acc=58.43923 nsp_loss=0.11466 nsp_acc=95.371 throughput=155.0K tks/s lr=0.0000885 time=168.80 INFO:root:[step 114999] Saving checkpoints to /home/ubuntu/ckpt-master/0114999.params, /home/ubuntu/ckpt-master/0114999.states. INFO:root:[step 115249] mlm_loss=2.08996 mlm_acc=59.68285 nsp_loss=0.05095 nsp_acc=98.064 throughput=129.0K tks/s lr=0.0000885 time=152.64 INFO:root:[step 115499] mlm_loss=1.91986 mlm_acc=61.68713 nsp_loss=0.05717 nsp_acc=97.833 throughput=137.0K tks/s lr=0.0000885 time=123.05 INFO:root:[step 115749] mlm_loss=1.87714 mlm_acc=59.80245 nsp_loss=0.10524 nsp_acc=95.770 throughput=133.0K tks/s lr=0.0000884 time=134.31 INFO:root:[step 115999] mlm_loss=1.80539 mlm_acc=62.16398 nsp_loss=0.05797 nsp_acc=97.872 throughput=121.0K tks/s lr=0.0000884 time=106.83 INFO:root:[step 116249] mlm_loss=1.97726 mlm_acc=60.70714 nsp_loss=0.05388 nsp_acc=98.081 throughput=125.0K tks/s lr=0.0000884 time=127.60 INFO:root:[step 116499] mlm_loss=1.93063 mlm_acc=61.29861 nsp_loss=0.05859 nsp_acc=97.835 throughput=130.0K tks/s lr=0.0000884 time=113.45 INFO:root:[step 116749] mlm_loss=1.90785 mlm_acc=59.57696 nsp_loss=0.06802 nsp_acc=97.449 throughput=129.0K tks/s lr=0.0000883 time=126.70 INFO:root:[step 116999] mlm_loss=1.93162 mlm_acc=59.78744 nsp_loss=0.06307 nsp_acc=97.636 throughput=125.0K tks/s lr=0.0000883 time=127.62 INFO:root:[step 117249] mlm_loss=1.63253 mlm_acc=68.16257 nsp_loss=0.08177 nsp_acc=96.953 throughput=145.0K tks/s lr=0.0000883 time=126.19 INFO:root:[step 117499] mlm_loss=1.82566 mlm_acc=63.28125 nsp_loss=0.06259 nsp_acc=97.706 throughput=123.0K tks/s lr=0.0000883 time=125.39 INFO:root:[step 117749] mlm_loss=2.04904 mlm_acc=59.33811 nsp_loss=0.05914 nsp_acc=97.772 throughput=143.0K tks/s lr=0.0000882 time=134.64 INFO:root:[step 117999] mlm_loss=2.06632 mlm_acc=57.76972 nsp_loss=0.17466 nsp_acc=92.322 throughput=143.0K tks/s lr=0.0000882 time=148.89 INFO:root:[step 118249] mlm_loss=1.93819 mlm_acc=60.24444 nsp_loss=0.10307 nsp_acc=95.744 throughput=147.0K tks/s lr=0.0000882 time=143.60 INFO:root:[step 118499] mlm_loss=2.16209 mlm_acc=57.80513 nsp_loss=0.07939 nsp_acc=96.866 throughput=155.0K tks/s lr=0.0000882 time=154.28 INFO:root:[step 118749] mlm_loss=2.09916 mlm_acc=59.11060 nsp_loss=0.09379 nsp_acc=96.157 throughput=144.0K tks/s lr=0.0000881 time=142.21 INFO:root:[step 118999] mlm_loss=1.98561 mlm_acc=60.29190 nsp_loss=0.07008 nsp_acc=97.254 throughput=134.0K tks/s lr=0.0000881 time=129.60 INFO:root:[step 119249] mlm_loss=1.84246 mlm_acc=62.15081 nsp_loss=0.05418 nsp_acc=98.011 throughput=131.0K tks/s lr=0.0000881 time=113.86 INFO:root:[step 119499] mlm_loss=1.96619 mlm_acc=59.88262 nsp_loss=0.08436 nsp_acc=96.531 throughput=143.0K tks/s lr=0.0000881 time=137.39 INFO:root:[step 119749] mlm_loss=2.08833 mlm_acc=59.59614 nsp_loss=0.05945 nsp_acc=97.670 throughput=146.0K tks/s lr=0.0000880 time=142.69 INFO:root:[step 119999] mlm_loss=1.91671 mlm_acc=61.28104 nsp_loss=0.05894 nsp_acc=97.727 throughput=123.0K tks/s lr=0.0000880 time=122.55 INFO:root:[step 119999] Saving checkpoints to /home/ubuntu/ckpt-master/0119999.params, /home/ubuntu/ckpt-master/0119999.states. INFO:root:[step 120249] mlm_loss=2.12013 mlm_acc=58.24093 nsp_loss=0.08749 nsp_acc=96.431 throughput=127.0K tks/s lr=0.0000880 time=153.53 INFO:root:[step 120499] mlm_loss=1.93895 mlm_acc=61.00399 nsp_loss=0.05346 nsp_acc=98.029 throughput=135.0K tks/s lr=0.0000880 time=116.02 INFO:root:[step 120749] mlm_loss=1.85863 mlm_acc=61.71047 nsp_loss=0.05749 nsp_acc=97.878 throughput=121.0K tks/s lr=0.0000879 time=121.30 INFO:root:[step 120999] mlm_loss=1.77774 mlm_acc=62.71393 nsp_loss=0.06014 nsp_acc=97.776 throughput=117.0K tks/s lr=0.0000879 time=102.97 INFO:root:[step 121249] mlm_loss=1.85112 mlm_acc=61.88785 nsp_loss=0.05778 nsp_acc=97.814 throughput=116.0K tks/s lr=0.0000879 time=119.29 INFO:root:[step 121499] mlm_loss=1.91701 mlm_acc=60.77763 nsp_loss=0.05811 nsp_acc=97.801 throughput=145.0K tks/s lr=0.0000879 time=123.87 INFO:root:[step 121749] mlm_loss=2.07578 mlm_acc=57.68550 nsp_loss=0.13826 nsp_acc=94.154 throughput=142.0K tks/s lr=0.0000878 time=166.12 INFO:root:[step 121999] mlm_loss=1.85008 mlm_acc=59.42548 nsp_loss=0.08192 nsp_acc=96.891 throughput=141.0K tks/s lr=0.0000878 time=125.29 INFO:root:[step 122249] mlm_loss=1.94883 mlm_acc=60.69308 nsp_loss=0.05891 nsp_acc=97.822 throughput=127.0K tks/s lr=0.0000878 time=127.50 INFO:root:[step 122499] mlm_loss=2.02104 mlm_acc=59.95490 nsp_loss=0.05293 nsp_acc=98.089 throughput=139.0K tks/s lr=0.0000878 time=134.26 INFO:root:[step 122749] mlm_loss=1.88451 mlm_acc=61.79991 nsp_loss=0.05472 nsp_acc=97.954 throughput=130.0K tks/s lr=0.0000877 time=114.56 INFO:root:[step 122999] mlm_loss=1.85999 mlm_acc=61.96256 nsp_loss=0.05812 nsp_acc=97.830 throughput=113.0K tks/s lr=0.0000877 time=119.70 INFO:root:[step 123249] mlm_loss=1.86153 mlm_acc=61.90892 nsp_loss=0.05569 nsp_acc=97.893 throughput=133.0K tks/s lr=0.0000877 time=113.17 INFO:root:[step 123499] mlm_loss=1.98631 mlm_acc=60.63430 nsp_loss=0.05409 nsp_acc=98.006 throughput=131.0K tks/s lr=0.0000877 time=131.39 INFO:root:[step 123749] mlm_loss=1.76013 mlm_acc=62.82635 nsp_loss=0.05651 nsp_acc=97.959 throughput=119.0K tks/s lr=0.0000876 time=108.35 INFO:root:[step 123999] mlm_loss=2.03950 mlm_acc=59.61399 nsp_loss=0.04880 nsp_acc=98.145 throughput=148.0K tks/s lr=0.0000876 time=142.21 INFO:root:[step 124249] mlm_loss=1.99344 mlm_acc=60.59420 nsp_loss=0.05377 nsp_acc=97.960 throughput=133.0K tks/s lr=0.0000876 time=132.45 INFO:root:[step 124499] mlm_loss=1.82978 mlm_acc=62.34783 nsp_loss=0.05953 nsp_acc=97.769 throughput=111.0K tks/s lr=0.0000876 time=115.75 INFO:root:[step 124749] mlm_loss=1.94537 mlm_acc=61.05112 nsp_loss=0.05707 nsp_acc=97.821 throughput=136.0K tks/s lr=0.0000875 time=115.76 INFO:root:[step 124999] mlm_loss=1.92126 mlm_acc=59.72447 nsp_loss=0.09186 nsp_acc=96.420 throughput=140.0K tks/s lr=0.0000875 time=142.31 INFO:root:[step 124999] Saving checkpoints to /home/ubuntu/ckpt-master/0124999.params, /home/ubuntu/ckpt-master/0124999.states. INFO:root:[step 125249] mlm_loss=1.91893 mlm_acc=61.13738 nsp_loss=0.05398 nsp_acc=98.019 throughput=117.0K tks/s lr=0.0000875 time=141.46 INFO:root:[step 125499] mlm_loss=2.05123 mlm_acc=58.62709 nsp_loss=0.06906 nsp_acc=97.317 throughput=144.0K tks/s lr=0.0000875 time=143.61 INFO:root:[step 125749] mlm_loss=1.80383 mlm_acc=62.43239 nsp_loss=0.05224 nsp_acc=98.127 throughput=127.0K tks/s lr=0.0000874 time=109.98 INFO:root:[step 125999] mlm_loss=2.03406 mlm_acc=57.98686 nsp_loss=0.08070 nsp_acc=96.833 throughput=153.0K tks/s lr=0.0000874 time=148.96 INFO:root:[step 126249] mlm_loss=1.95916 mlm_acc=59.86897 nsp_loss=0.07722 nsp_acc=96.960 throughput=125.0K tks/s lr=0.0000874 time=126.75 INFO:root:[step 126499] mlm_loss=2.06761 mlm_acc=58.83172 nsp_loss=0.07345 nsp_acc=97.116 throughput=130.0K tks/s lr=0.0000874 time=132.74 INFO:root:[step 126749] mlm_loss=1.96075 mlm_acc=59.08839 nsp_loss=0.06497 nsp_acc=97.519 throughput=147.0K tks/s lr=0.0000873 time=124.94 INFO:root:[step 126999] mlm_loss=2.25733 mlm_acc=57.02318 nsp_loss=0.09114 nsp_acc=96.364 throughput=143.0K tks/s lr=0.0000873 time=140.78 INFO:root:[step 127249] mlm_loss=2.07017 mlm_acc=58.63941 nsp_loss=0.09972 nsp_acc=96.062 throughput=142.0K tks/s lr=0.0000873 time=140.86 INFO:root:[step 127499] mlm_loss=2.08047 mlm_acc=58.71426 nsp_loss=0.10726 nsp_acc=95.483 throughput=146.0K tks/s lr=0.0000873 time=157.58 INFO:root:[step 127749] mlm_loss=1.94858 mlm_acc=60.22484 nsp_loss=0.05529 nsp_acc=97.948 throughput=136.0K tks/s lr=0.0000872 time=129.33 INFO:root:[step 127999] mlm_loss=1.82651 mlm_acc=60.95740 nsp_loss=0.11666 nsp_acc=95.278 throughput=132.0K tks/s lr=0.0000872 time=134.62 INFO:root:[step 128249] mlm_loss=1.92797 mlm_acc=60.73155 nsp_loss=0.05473 nsp_acc=97.966 throughput=130.0K tks/s lr=0.0000872 time=130.66 INFO:root:[step 128499] mlm_loss=1.88815 mlm_acc=59.81667 nsp_loss=0.09115 nsp_acc=96.441 throughput=135.0K tks/s lr=0.0000872 time=137.75 INFO:root:[step 128749] mlm_loss=1.79789 mlm_acc=62.45639 nsp_loss=0.05484 nsp_acc=98.024 throughput=119.0K tks/s lr=0.0000871 time=107.15 INFO:root:[step 128999] mlm_loss=1.79125 mlm_acc=62.41510 nsp_loss=0.05619 nsp_acc=97.954 throughput=118.0K tks/s lr=0.0000871 time=109.98 INFO:root:[step 129249] mlm_loss=1.93595 mlm_acc=60.91232 nsp_loss=0.05155 nsp_acc=98.165 throughput=131.0K tks/s lr=0.0000871 time=131.95 INFO:root:[step 129499] mlm_loss=1.85243 mlm_acc=61.87844 nsp_loss=0.05590 nsp_acc=97.995 throughput=130.0K tks/s lr=0.0000871 time=113.81 INFO:root:[step 129749] mlm_loss=1.76874 mlm_acc=62.36031 nsp_loss=0.05829 nsp_acc=97.842 throughput=113.0K tks/s lr=0.0000870 time=116.25 INFO:root:[step 129999] mlm_loss=1.96671 mlm_acc=60.76783 nsp_loss=0.05570 nsp_acc=97.951 throughput=134.0K tks/s lr=0.0000870 time=119.79 INFO:root:[step 129999] Saving checkpoints to /home/ubuntu/ckpt-master/0129999.params, /home/ubuntu/ckpt-master/0129999.states. INFO:root:[step 130249] mlm_loss=2.02989 mlm_acc=59.46883 nsp_loss=0.07946 nsp_acc=96.891 throughput=137.0K tks/s lr=0.0000870 time=161.69 INFO:root:[step 130499] mlm_loss=2.02390 mlm_acc=58.95870 nsp_loss=0.07201 nsp_acc=97.207 throughput=142.0K tks/s lr=0.0000870 time=137.24 INFO:root:[step 130749] mlm_loss=2.05810 mlm_acc=58.65991 nsp_loss=0.08778 nsp_acc=96.582 throughput=139.0K tks/s lr=0.0000869 time=138.89 INFO:root:[step 130999] mlm_loss=1.77140 mlm_acc=62.68895 nsp_loss=0.05840 nsp_acc=97.873 throughput=117.0K tks/s lr=0.0000869 time=105.33 INFO:root:[step 131249] mlm_loss=1.93395 mlm_acc=60.98548 nsp_loss=0.05281 nsp_acc=98.016 throughput=129.0K tks/s lr=0.0000869 time=125.05 INFO:root:[step 131499] mlm_loss=1.87425 mlm_acc=61.65786 nsp_loss=0.05679 nsp_acc=97.933 throughput=118.0K tks/s lr=0.0000869 time=122.87 INFO:root:[step 131749] mlm_loss=1.89603 mlm_acc=61.50750 nsp_loss=0.05804 nsp_acc=97.818 throughput=128.0K tks/s lr=0.0000868 time=113.67 INFO:root:[step 131999] mlm_loss=2.04039 mlm_acc=58.18854 nsp_loss=0.11001 nsp_acc=95.274 throughput=153.0K tks/s lr=0.0000868 time=154.28 INFO:root:[step 132249] mlm_loss=1.94012 mlm_acc=60.17386 nsp_loss=0.06202 nsp_acc=97.625 throughput=134.0K tks/s lr=0.0000868 time=135.89 INFO:root:[step 132499] mlm_loss=2.03286 mlm_acc=58.55496 nsp_loss=0.06737 nsp_acc=97.554 throughput=143.0K tks/s lr=0.0000868 time=137.96 INFO:root:[step 132749] mlm_loss=1.95894 mlm_acc=61.12207 nsp_loss=0.05359 nsp_acc=98.020 throughput=129.0K tks/s lr=0.0000867 time=128.43 INFO:root:[step 132999] mlm_loss=1.79957 mlm_acc=61.11137 nsp_loss=0.09803 nsp_acc=95.957 throughput=142.0K tks/s lr=0.0000867 time=122.70 INFO:root:[step 133249] mlm_loss=1.93334 mlm_acc=61.14718 nsp_loss=0.06070 nsp_acc=97.760 throughput=130.0K tks/s lr=0.0000867 time=128.66 INFO:root:[step 133499] mlm_loss=2.06353 mlm_acc=60.14698 nsp_loss=0.05193 nsp_acc=98.071 throughput=143.0K tks/s lr=0.0000867 time=138.10 INFO:root:[step 133749] mlm_loss=2.19700 mlm_acc=56.77005 nsp_loss=0.09703 nsp_acc=96.085 throughput=157.0K tks/s lr=0.0000866 time=156.80 INFO:root:[step 133999] mlm_loss=2.04648 mlm_acc=59.55179 nsp_loss=0.08569 nsp_acc=96.641 throughput=151.0K tks/s lr=0.0000866 time=162.85 INFO:root:[step 134249] mlm_loss=1.86921 mlm_acc=61.38711 nsp_loss=0.05169 nsp_acc=98.055 throughput=135.0K tks/s lr=0.0000866 time=119.12 INFO:root:[step 134499] mlm_loss=1.95825 mlm_acc=60.77533 nsp_loss=0.05303 nsp_acc=98.023 throughput=134.0K tks/s lr=0.0000866 time=128.98 INFO:root:[step 134749] mlm_loss=1.99717 mlm_acc=60.45014 nsp_loss=0.05232 nsp_acc=98.058 throughput=140.0K tks/s lr=0.0000865 time=135.15 INFO:root:[step 134999] mlm_loss=2.01005 mlm_acc=60.84128 nsp_loss=0.05426 nsp_acc=97.954 throughput=135.0K tks/s lr=0.0000865 time=131.58 INFO:root:[step 134999] Saving checkpoints to /home/ubuntu/ckpt-master/0134999.params, /home/ubuntu/ckpt-master/0134999.states. INFO:root:[step 135249] mlm_loss=1.71438 mlm_acc=62.59960 nsp_loss=0.06308 nsp_acc=97.700 throughput=105.0K tks/s lr=0.0000865 time=128.27 INFO:root:[step 135499] mlm_loss=2.03530 mlm_acc=58.33005 nsp_loss=0.12702 nsp_acc=94.724 throughput=150.0K tks/s lr=0.0000865 time=164.19 INFO:root:[step 135749] mlm_loss=1.88795 mlm_acc=59.80555 nsp_loss=0.07255 nsp_acc=97.197 throughput=139.0K tks/s lr=0.0000864 time=130.02 INFO:root:[step 135999] mlm_loss=1.72062 mlm_acc=61.41238 nsp_loss=0.09235 nsp_acc=96.435 throughput=128.0K tks/s lr=0.0000864 time=134.68 INFO:root:[step 136249] mlm_loss=1.59622 mlm_acc=64.17034 nsp_loss=0.05919 nsp_acc=97.879 throughput=109.0K tks/s lr=0.0000864 time=102.99 INFO:root:[step 136499] mlm_loss=1.75162 mlm_acc=63.21993 nsp_loss=0.05405 nsp_acc=98.044 throughput=123.0K tks/s lr=0.0000864 time=107.07 INFO:root:[step 136749] mlm_loss=2.02046 mlm_acc=59.57804 nsp_loss=0.15186 nsp_acc=93.393 throughput=128.0K tks/s lr=0.0000863 time=132.07 INFO:root:[step 136999] mlm_loss=1.84591 mlm_acc=62.17107 nsp_loss=0.05656 nsp_acc=97.884 throughput=117.0K tks/s lr=0.0000863 time=124.59 INFO:root:[step 137249] mlm_loss=1.50635 mlm_acc=64.93077 nsp_loss=0.06328 nsp_acc=97.751 throughput=106.0K tks/s lr=0.0000863 time=97.56 INFO:root:[step 137499] mlm_loss=1.99837 mlm_acc=59.58491 nsp_loss=0.07034 nsp_acc=97.335 throughput=146.0K tks/s lr=0.0000863 time=149.08 INFO:root:[step 137749] mlm_loss=1.74876 mlm_acc=62.76622 nsp_loss=0.05858 nsp_acc=97.798 throughput=114.0K tks/s lr=0.0000862 time=105.44 INFO:root:[step 137999] mlm_loss=1.82710 mlm_acc=62.09486 nsp_loss=0.05694 nsp_acc=97.889 throughput=132.0K tks/s lr=0.0000862 time=117.52 INFO:root:[step 138249] mlm_loss=1.73973 mlm_acc=61.50402 nsp_loss=0.07091 nsp_acc=97.373 throughput=125.0K tks/s lr=0.0000862 time=123.83 INFO:root:[step 138499] mlm_loss=1.91976 mlm_acc=60.29161 nsp_loss=0.06825 nsp_acc=97.292 throughput=132.0K tks/s lr=0.0000862 time=131.49 INFO:root:[step 138749] mlm_loss=1.93683 mlm_acc=61.26889 nsp_loss=0.05344 nsp_acc=98.013 throughput=139.0K tks/s lr=0.0000861 time=120.11 INFO:root:[step 138999] mlm_loss=2.06965 mlm_acc=60.22668 nsp_loss=0.04995 nsp_acc=98.114 throughput=145.0K tks/s lr=0.0000861 time=138.51 INFO:root:[step 139249] mlm_loss=1.93444 mlm_acc=61.17571 nsp_loss=0.05541 nsp_acc=97.948 throughput=129.0K tks/s lr=0.0000861 time=130.88 INFO:root:[step 139499] mlm_loss=1.81769 mlm_acc=62.41793 nsp_loss=0.05505 nsp_acc=98.025 throughput=124.0K tks/s lr=0.0000861 time=110.86 INFO:root:[step 139749] mlm_loss=2.03702 mlm_acc=60.33691 nsp_loss=0.05070 nsp_acc=98.102 throughput=144.0K tks/s lr=0.0000860 time=138.65 INFO:root:[step 139999] mlm_loss=2.15730 mlm_acc=58.25803 nsp_loss=0.09504 nsp_acc=96.129 throughput=136.0K tks/s lr=0.0000860 time=152.30 INFO:root:[step 139999] Saving checkpoints to /home/ubuntu/ckpt-master/0139999.params, /home/ubuntu/ckpt-master/0139999.states. INFO:root:[step 140249] mlm_loss=1.75350 mlm_acc=62.98510 nsp_loss=0.05531 nsp_acc=98.035 throughput=108.0K tks/s lr=0.0000860 time=125.23 INFO:root:[step 140499] mlm_loss=1.83315 mlm_acc=62.30057 nsp_loss=0.05673 nsp_acc=97.943 throughput=128.0K tks/s lr=0.0000860 time=114.61 INFO:root:[step 140749] mlm_loss=1.77431 mlm_acc=62.56004 nsp_loss=0.05786 nsp_acc=97.867 throughput=118.0K tks/s lr=0.0000859 time=121.57 INFO:root:[step 140999] mlm_loss=1.86098 mlm_acc=62.26184 nsp_loss=0.05449 nsp_acc=97.933 throughput=127.0K tks/s lr=0.0000859 time=112.80 INFO:root:[step 141249] mlm_loss=1.92371 mlm_acc=61.45028 nsp_loss=0.05169 nsp_acc=98.132 throughput=133.0K tks/s lr=0.0000859 time=125.68 INFO:root:[step 141499] mlm_loss=1.95434 mlm_acc=61.07881 nsp_loss=0.05207 nsp_acc=98.029 throughput=135.0K tks/s lr=0.0000859 time=133.16 INFO:root:[step 141749] mlm_loss=2.01894 mlm_acc=60.27389 nsp_loss=0.05133 nsp_acc=98.057 throughput=139.0K tks/s lr=0.0000858 time=137.81 INFO:root:[step 141999] mlm_loss=1.93757 mlm_acc=61.45699 nsp_loss=0.05426 nsp_acc=98.044 throughput=138.0K tks/s lr=0.0000858 time=117.45 INFO:root:[step 142249] mlm_loss=2.03974 mlm_acc=59.40537 nsp_loss=0.09806 nsp_acc=95.997 throughput=145.0K tks/s lr=0.0000858 time=162.37 INFO:root:[step 142499] mlm_loss=1.84334 mlm_acc=60.80456 nsp_loss=0.11592 nsp_acc=94.985 throughput=140.0K tks/s lr=0.0000858 time=122.63 INFO:root:[step 142749] mlm_loss=1.78566 mlm_acc=62.37730 nsp_loss=0.07362 nsp_acc=97.168 throughput=115.0K tks/s lr=0.0000857 time=118.13 INFO:root:[step 142999] mlm_loss=1.84252 mlm_acc=62.23410 nsp_loss=0.05538 nsp_acc=97.951 throughput=126.0K tks/s lr=0.0000857 time=113.85 INFO:root:[step 143249] mlm_loss=1.94631 mlm_acc=59.53486 nsp_loss=0.11144 nsp_acc=95.332 throughput=144.0K tks/s lr=0.0000857 time=141.17 INFO:root:[step 143499] mlm_loss=2.08917 mlm_acc=58.12043 nsp_loss=0.12006 nsp_acc=95.054 throughput=157.0K tks/s lr=0.0000857 time=175.32 INFO:root:[step 143749] mlm_loss=2.00073 mlm_acc=61.02975 nsp_loss=0.05278 nsp_acc=98.035 throughput=145.0K tks/s lr=0.0000856 time=127.16 INFO:root:[step 143999] mlm_loss=1.88750 mlm_acc=61.34900 nsp_loss=0.05524 nsp_acc=97.965 throughput=126.0K tks/s lr=0.0000856 time=128.93 INFO:root:[step 144249] mlm_loss=1.78002 mlm_acc=62.52072 nsp_loss=0.05376 nsp_acc=97.982 throughput=124.0K tks/s lr=0.0000856 time=110.67 INFO:root:[step 144499] mlm_loss=2.00669 mlm_acc=59.72284 nsp_loss=0.13429 nsp_acc=94.270 throughput=139.0K tks/s lr=0.0000856 time=135.20 INFO:root:[step 144749] mlm_loss=1.88928 mlm_acc=62.38787 nsp_loss=0.06021 nsp_acc=97.671 throughput=132.0K tks/s lr=0.0000855 time=131.23 INFO:root:[step 144999] mlm_loss=1.81856 mlm_acc=62.43015 nsp_loss=0.05550 nsp_acc=97.912 throughput=127.0K tks/s lr=0.0000855 time=110.61 INFO:root:[step 144999] Saving checkpoints to /home/ubuntu/ckpt-master/0144999.params, /home/ubuntu/ckpt-master/0144999.states. INFO:root:[step 145249] mlm_loss=1.92285 mlm_acc=61.33103 nsp_loss=0.05076 nsp_acc=98.138 throughput=117.0K tks/s lr=0.0000855 time=144.45 INFO:root:[step 145499] mlm_loss=2.05344 mlm_acc=58.89644 nsp_loss=0.08661 nsp_acc=96.487 throughput=136.0K tks/s lr=0.0000855 time=134.12 INFO:root:[step 145749] mlm_loss=1.90386 mlm_acc=60.83110 nsp_loss=0.06116 nsp_acc=97.687 throughput=140.0K tks/s lr=0.0000854 time=130.58 INFO:root:[step 145999] mlm_loss=2.06693 mlm_acc=59.69430 nsp_loss=0.06013 nsp_acc=97.658 throughput=154.0K tks/s lr=0.0000854 time=155.39 INFO:root:[step 146249] mlm_loss=2.12017 mlm_acc=58.33443 nsp_loss=0.07761 nsp_acc=96.868 throughput=146.0K tks/s lr=0.0000854 time=156.78 INFO:root:[step 146499] mlm_loss=1.97766 mlm_acc=60.78018 nsp_loss=0.05838 nsp_acc=97.791 throughput=141.0K tks/s lr=0.0000854 time=133.45 INFO:root:[step 146749] mlm_loss=1.97946 mlm_acc=60.08221 nsp_loss=0.07192 nsp_acc=97.132 throughput=148.0K tks/s lr=0.0000853 time=152.76 INFO:root:[step 146999] mlm_loss=1.80784 mlm_acc=62.61852 nsp_loss=0.05801 nsp_acc=97.896 throughput=125.0K tks/s lr=0.0000853 time=111.04 INFO:root:[step 147249] mlm_loss=1.97666 mlm_acc=59.19499 nsp_loss=0.13356 nsp_acc=94.363 throughput=151.0K tks/s lr=0.0000853 time=164.80 INFO:root:[step 147499] mlm_loss=1.89933 mlm_acc=61.80774 nsp_loss=0.05384 nsp_acc=97.980 throughput=134.0K tks/s lr=0.0000853 time=118.44 INFO:root:[step 147749] mlm_loss=1.98974 mlm_acc=59.41590 nsp_loss=0.13621 nsp_acc=94.261 throughput=153.0K tks/s lr=0.0000852 time=163.35 INFO:root:[step 147999] mlm_loss=1.98149 mlm_acc=59.18368 nsp_loss=0.08379 nsp_acc=96.704 throughput=147.0K tks/s lr=0.0000852 time=132.12 INFO:root:[step 148249] mlm_loss=2.02975 mlm_acc=60.53639 nsp_loss=0.04907 nsp_acc=98.162 throughput=145.0K tks/s lr=0.0000852 time=137.89 INFO:root:[step 148499] mlm_loss=2.04150 mlm_acc=60.39864 nsp_loss=0.05296 nsp_acc=97.999 throughput=140.0K tks/s lr=0.0000852 time=144.59 INFO:root:[step 148749] mlm_loss=1.99052 mlm_acc=58.60104 nsp_loss=0.06757 nsp_acc=97.536 throughput=143.0K tks/s lr=0.0000851 time=131.53 INFO:root:[step 148999] mlm_loss=1.86849 mlm_acc=61.61063 nsp_loss=0.05853 nsp_acc=97.834 throughput=125.0K tks/s lr=0.0000851 time=126.01 INFO:root:[step 149249] mlm_loss=1.76398 mlm_acc=62.81609 nsp_loss=0.05706 nsp_acc=97.933 throughput=121.0K tks/s lr=0.0000851 time=110.23 INFO:root:[step 149499] mlm_loss=1.79331 mlm_acc=62.60652 nsp_loss=0.06806 nsp_acc=97.446 throughput=110.0K tks/s lr=0.0000851 time=117.12 INFO:root:[step 149749] mlm_loss=1.77376 mlm_acc=62.69747 nsp_loss=0.05491 nsp_acc=98.002 throughput=120.0K tks/s lr=0.0000850 time=111.41 INFO:root:[step 149999] mlm_loss=1.92366 mlm_acc=61.40237 nsp_loss=0.05235 nsp_acc=98.098 throughput=134.0K tks/s lr=0.0000850 time=128.12 INFO:root:[step 149999] Saving checkpoints to /home/ubuntu/ckpt-master/0149999.params, /home/ubuntu/ckpt-master/0149999.states. INFO:root:[step 150249] mlm_loss=1.93287 mlm_acc=60.81020 nsp_loss=0.10992 nsp_acc=95.388 throughput=131.0K tks/s lr=0.0000850 time=163.04 INFO:root:[step 150499] mlm_loss=1.89397 mlm_acc=60.47055 nsp_loss=0.11787 nsp_acc=95.116 throughput=136.0K tks/s lr=0.0000850 time=135.45 INFO:root:[step 150749] mlm_loss=1.86532 mlm_acc=61.26094 nsp_loss=0.05402 nsp_acc=98.108 throughput=140.0K tks/s lr=0.0000849 time=119.26 INFO:root:[step 150999] mlm_loss=2.03287 mlm_acc=59.29060 nsp_loss=0.07870 nsp_acc=96.887 throughput=145.0K tks/s lr=0.0000849 time=146.25 INFO:root:[step 151249] mlm_loss=1.49280 mlm_acc=70.34648 nsp_loss=0.08462 nsp_acc=96.861 throughput=135.0K tks/s lr=0.0000849 time=134.88 INFO:root:[step 151499] mlm_loss=1.85588 mlm_acc=60.14516 nsp_loss=0.08964 nsp_acc=96.454 throughput=138.0K tks/s lr=0.0000849 time=139.77 INFO:root:[step 151749] mlm_loss=1.84228 mlm_acc=61.17008 nsp_loss=0.05767 nsp_acc=97.911 throughput=132.0K tks/s lr=0.0000848 time=128.67 INFO:root:[step 151999] mlm_loss=1.82896 mlm_acc=62.47888 nsp_loss=0.05533 nsp_acc=97.992 throughput=127.0K tks/s lr=0.0000848 time=112.44 INFO:root:[step 152249] mlm_loss=2.09665 mlm_acc=58.07985 nsp_loss=0.10347 nsp_acc=95.889 throughput=125.0K tks/s lr=0.0000848 time=127.28 INFO:root:[step 152499] mlm_loss=1.68040 mlm_acc=63.44213 nsp_loss=0.06078 nsp_acc=97.798 throughput=119.0K tks/s lr=0.0000848 time=109.49 INFO:root:[step 152749] mlm_loss=1.78319 mlm_acc=62.02458 nsp_loss=0.06013 nsp_acc=97.855 throughput=127.0K tks/s lr=0.0000847 time=127.90 INFO:root:[step 152999] mlm_loss=1.82965 mlm_acc=62.15198 nsp_loss=0.05825 nsp_acc=97.824 throughput=126.0K tks/s lr=0.0000847 time=110.38 INFO:root:[step 153249] mlm_loss=1.94380 mlm_acc=61.19929 nsp_loss=0.04881 nsp_acc=98.187 throughput=133.0K tks/s lr=0.0000847 time=130.72 INFO:root:[step 153499] mlm_loss=1.97555 mlm_acc=59.23905 nsp_loss=0.06949 nsp_acc=97.358 throughput=143.0K tks/s lr=0.0000847 time=137.64 INFO:root:[step 153749] mlm_loss=1.84128 mlm_acc=61.48229 nsp_loss=0.04986 nsp_acc=98.098 throughput=136.0K tks/s lr=0.0000846 time=124.09 INFO:root:[step 153999] mlm_loss=1.68914 mlm_acc=63.82381 nsp_loss=0.05007 nsp_acc=98.190 throughput=107.0K tks/s lr=0.0000846 time=114.22 INFO:root:[step 154249] mlm_loss=1.71186 mlm_acc=63.49035 nsp_loss=0.05426 nsp_acc=98.020 throughput=120.0K tks/s lr=0.0000846 time=107.09 INFO:root:[step 154499] mlm_loss=1.66505 mlm_acc=63.56010 nsp_loss=0.05375 nsp_acc=98.032 throughput=117.0K tks/s lr=0.0000846 time=107.53 INFO:root:[step 154749] mlm_loss=1.67560 mlm_acc=64.53883 nsp_loss=0.06772 nsp_acc=97.485 throughput=127.0K tks/s lr=0.0000845 time=127.74 INFO:root:[step 154999] mlm_loss=1.68911 mlm_acc=62.92396 nsp_loss=0.06284 nsp_acc=97.656 throughput=123.0K tks/s lr=0.0000845 time=109.99 INFO:root:[step 154999] Saving checkpoints to /home/ubuntu/ckpt-master/0154999.params, /home/ubuntu/ckpt-master/0154999.states. INFO:root:[step 155249] mlm_loss=1.84902 mlm_acc=61.62090 nsp_loss=0.04694 nsp_acc=98.271 throughput=117.0K tks/s lr=0.0000845 time=143.28 INFO:root:[step 155499] mlm_loss=1.89790 mlm_acc=61.50719 nsp_loss=0.04498 nsp_acc=98.310 throughput=139.0K tks/s lr=0.0000845 time=130.73 INFO:root:[step 155749] mlm_loss=2.06261 mlm_acc=58.61251 nsp_loss=0.10687 nsp_acc=95.662 throughput=158.0K tks/s lr=0.0000844 time=161.12 INFO:root:[step 155999] mlm_loss=1.79235 mlm_acc=62.40240 nsp_loss=0.06052 nsp_acc=97.746 throughput=128.0K tks/s lr=0.0000844 time=122.98 INFO:root:[step 156249] mlm_loss=2.02182 mlm_acc=59.73469 nsp_loss=0.09325 nsp_acc=96.117 throughput=148.0K tks/s lr=0.0000844 time=146.80 INFO:root:[step 156499] mlm_loss=1.87001 mlm_acc=62.03895 nsp_loss=0.04901 nsp_acc=98.192 throughput=126.0K tks/s lr=0.0000844 time=127.29 INFO:root:[step 156749] mlm_loss=1.74899 mlm_acc=61.65780 nsp_loss=0.06712 nsp_acc=97.432 throughput=144.0K tks/s lr=0.0000843 time=123.70 INFO:root:[step 156999] mlm_loss=1.75143 mlm_acc=61.94252 nsp_loss=0.07717 nsp_acc=97.045 throughput=126.0K tks/s lr=0.0000843 time=126.41 INFO:root:[step 157249] mlm_loss=1.93950 mlm_acc=60.35417 nsp_loss=0.10834 nsp_acc=95.413 throughput=153.0K tks/s lr=0.0000843 time=153.19 INFO:root:[step 157499] mlm_loss=1.95313 mlm_acc=61.41007 nsp_loss=0.04511 nsp_acc=98.327 throughput=139.0K tks/s lr=0.0000843 time=130.42 INFO:root:[step 157749] mlm_loss=1.98041 mlm_acc=60.96136 nsp_loss=0.04789 nsp_acc=98.175 throughput=141.0K tks/s lr=0.0000842 time=134.10 INFO:root:[step 157999] mlm_loss=2.03420 mlm_acc=59.55501 nsp_loss=0.08328 nsp_acc=96.696 throughput=159.0K tks/s lr=0.0000842 time=161.14 INFO:root:[step 158249] mlm_loss=1.79406 mlm_acc=62.55972 nsp_loss=0.04865 nsp_acc=98.220 throughput=120.0K tks/s lr=0.0000842 time=123.43 INFO:root:[step 158499] mlm_loss=1.89871 mlm_acc=60.03860 nsp_loss=0.09054 nsp_acc=96.218 throughput=145.0K tks/s lr=0.0000842 time=142.37 INFO:root:[step 158749] mlm_loss=2.01448 mlm_acc=59.50767 nsp_loss=0.10144 nsp_acc=95.911 throughput=157.0K tks/s lr=0.0000841 time=156.70 INFO:root:[step 158999] mlm_loss=1.83326 mlm_acc=61.42653 nsp_loss=0.05060 nsp_acc=98.144 throughput=136.0K tks/s lr=0.0000841 time=137.37 INFO:root:[step 159249] mlm_loss=1.90029 mlm_acc=60.47315 nsp_loss=0.05486 nsp_acc=97.907 throughput=143.0K tks/s lr=0.0000841 time=138.21 INFO:root:[step 159499] mlm_loss=1.81319 mlm_acc=61.36930 nsp_loss=0.05329 nsp_acc=98.074 throughput=130.0K tks/s lr=0.0000841 time=130.70 INFO:root:[step 159749] mlm_loss=1.93651 mlm_acc=61.72194 nsp_loss=0.04267 nsp_acc=98.418 throughput=136.0K tks/s lr=0.0000840 time=134.09 INFO:root:[step 159999] mlm_loss=1.83333 mlm_acc=62.60572 nsp_loss=0.05155 nsp_acc=98.125 throughput=136.0K tks/s lr=0.0000840 time=116.35 INFO:root:[step 159999] Saving checkpoints to /home/ubuntu/ckpt-master/0159999.params, /home/ubuntu/ckpt-master/0159999.states. INFO:root:[step 160249] mlm_loss=1.75741 mlm_acc=62.72741 nsp_loss=0.05959 nsp_acc=97.834 throughput=110.0K tks/s lr=0.0000840 time=135.51 INFO:root:[step 160499] mlm_loss=1.79007 mlm_acc=61.46621 nsp_loss=0.07011 nsp_acc=97.258 throughput=139.0K tks/s lr=0.0000840 time=127.24 INFO:root:[step 160749] mlm_loss=1.71876 mlm_acc=63.26895 nsp_loss=0.04988 nsp_acc=98.178 throughput=117.0K tks/s lr=0.0000839 time=118.53 INFO:root:[step 160999] mlm_loss=1.77924 mlm_acc=62.03493 nsp_loss=0.09064 nsp_acc=96.325 throughput=141.0K tks/s lr=0.0000839 time=138.75 INFO:root:[step 161249] mlm_loss=1.84484 mlm_acc=62.34899 nsp_loss=0.05253 nsp_acc=98.094 throughput=138.0K tks/s lr=0.0000839 time=119.80 INFO:root:[step 161499] mlm_loss=1.66270 mlm_acc=63.42012 nsp_loss=0.06539 nsp_acc=97.524 throughput=111.0K tks/s lr=0.0000839 time=104.95 INFO:root:[step 161749] mlm_loss=1.60647 mlm_acc=64.28044 nsp_loss=0.05990 nsp_acc=97.890 throughput=115.0K tks/s lr=0.0000838 time=116.54 INFO:root:[step 161999] mlm_loss=1.96774 mlm_acc=59.37087 nsp_loss=0.07617 nsp_acc=96.880 throughput=137.0K tks/s lr=0.0000838 time=135.40 INFO:root:[step 162249] mlm_loss=1.88146 mlm_acc=61.83002 nsp_loss=0.04843 nsp_acc=98.203 throughput=138.0K tks/s lr=0.0000838 time=121.06 INFO:root:[step 162749] mlm_loss=3.79964 mlm_acc=60.81176 nsp_loss=0.12934 nsp_acc=97.527 throughput=132.0K tks/s lr=0.0000837 time=263.18 INFO:root:[step 162999] mlm_loss=1.65230 mlm_acc=64.12607 nsp_loss=0.05615 nsp_acc=97.988 throughput=115.0K tks/s lr=0.0000837 time=107.15 INFO:root:[step 163249] mlm_loss=1.87579 mlm_acc=59.35295 nsp_loss=0.09173 nsp_acc=96.366 throughput=144.0K tks/s lr=0.0000837 time=140.72 INFO:root:[step 163499] mlm_loss=2.04178 mlm_acc=59.74463 nsp_loss=0.06249 nsp_acc=97.609 throughput=154.0K tks/s lr=0.0000837 time=154.38 INFO:root:[step 163749] mlm_loss=1.71816 mlm_acc=63.58442 nsp_loss=0.05187 nsp_acc=98.188 throughput=114.0K tks/s lr=0.0000836 time=118.48 INFO:root:[step 163999] mlm_loss=1.66825 mlm_acc=64.12610 nsp_loss=0.04929 nsp_acc=98.238 throughput=124.0K tks/s lr=0.0000836 time=108.43 INFO:root:[step 164249] mlm_loss=1.77375 mlm_acc=60.87393 nsp_loss=0.07474 nsp_acc=97.015 throughput=137.0K tks/s lr=0.0000836 time=138.42 INFO:root:[step 164499] mlm_loss=1.80652 mlm_acc=62.01657 nsp_loss=0.04907 nsp_acc=98.202 throughput=137.0K tks/s lr=0.0000836 time=127.42 INFO:root:[step 164749] mlm_loss=1.85508 mlm_acc=61.44959 nsp_loss=0.04771 nsp_acc=98.260 throughput=138.0K tks/s lr=0.0000835 time=123.21 INFO:root:[step 164999] mlm_loss=1.79610 mlm_acc=62.62019 nsp_loss=0.05373 nsp_acc=98.037 throughput=118.0K tks/s lr=0.0000835 time=121.04 INFO:root:[step 164999] Saving checkpoints to /home/ubuntu/ckpt-master/0164999.params, /home/ubuntu/ckpt-master/0164999.states. INFO:root:[step 165249] mlm_loss=1.87378 mlm_acc=61.94678 nsp_loss=0.04972 nsp_acc=98.144 throughput=118.0K tks/s lr=0.0000835 time=140.99 INFO:root:[step 165499] mlm_loss=1.97633 mlm_acc=59.95169 nsp_loss=0.11323 nsp_acc=95.282 throughput=147.0K tks/s lr=0.0000835 time=140.65 INFO:root:[step 165749] mlm_loss=2.10844 mlm_acc=58.52963 nsp_loss=0.06028 nsp_acc=97.683 throughput=154.0K tks/s lr=0.0000834 time=157.51 INFO:root:[step 165999] mlm_loss=1.94366 mlm_acc=60.92910 nsp_loss=0.06207 nsp_acc=97.568 throughput=143.0K tks/s lr=0.0000834 time=137.03 INFO:root:[step 166249] mlm_loss=2.05513 mlm_acc=58.50630 nsp_loss=0.14432 nsp_acc=93.878 throughput=159.0K tks/s lr=0.0000834 time=162.01 INFO:root:[step 166499] mlm_loss=1.86234 mlm_acc=61.94037 nsp_loss=0.05075 nsp_acc=98.148 throughput=127.0K tks/s lr=0.0000834 time=128.27 INFO:root:[step 166749] mlm_loss=1.84316 mlm_acc=60.91615 nsp_loss=0.11685 nsp_acc=95.097 throughput=128.0K tks/s lr=0.0000833 time=131.46 INFO:root:[step 166999] mlm_loss=1.76842 mlm_acc=62.31095 nsp_loss=0.04744 nsp_acc=98.250 throughput=131.0K tks/s lr=0.0000833 time=115.18 INFO:root:[step 167249] mlm_loss=1.83288 mlm_acc=62.35607 nsp_loss=0.04659 nsp_acc=98.285 throughput=127.0K tks/s lr=0.0000833 time=126.63 INFO:root:[step 167499] mlm_loss=1.89007 mlm_acc=60.44627 nsp_loss=0.05990 nsp_acc=97.750 throughput=141.0K tks/s lr=0.0000833 time=138.87 INFO:root:[step 167749] mlm_loss=1.71112 mlm_acc=63.64306 nsp_loss=0.04605 nsp_acc=98.346 throughput=124.0K tks/s lr=0.0000832 time=110.93 INFO:root:[step 167999] mlm_loss=1.84657 mlm_acc=62.40064 nsp_loss=0.04813 nsp_acc=98.217 throughput=133.0K tks/s lr=0.0000832 time=127.91 INFO:root:[step 168249] mlm_loss=1.91157 mlm_acc=62.00606 nsp_loss=0.04940 nsp_acc=98.119 throughput=140.0K tks/s lr=0.0000832 time=123.09 INFO:root:[step 168499] mlm_loss=1.84918 mlm_acc=61.61076 nsp_loss=0.08933 nsp_acc=96.402 throughput=134.0K tks/s lr=0.0000832 time=132.80 INFO:root:[step 168749] mlm_loss=2.06769 mlm_acc=59.01886 nsp_loss=0.07986 nsp_acc=96.817 throughput=149.0K tks/s lr=0.0000831 time=163.68 INFO:root:[step 168999] mlm_loss=1.80274 mlm_acc=63.01432 nsp_loss=0.05299 nsp_acc=98.063 throughput=128.0K tks/s lr=0.0000831 time=113.34 INFO:root:[step 169249] mlm_loss=1.91677 mlm_acc=61.68077 nsp_loss=0.04719 nsp_acc=98.220 throughput=139.0K tks/s lr=0.0000831 time=133.20 INFO:root:[step 169499] mlm_loss=1.95261 mlm_acc=61.56800 nsp_loss=0.04469 nsp_acc=98.305 throughput=140.0K tks/s lr=0.0000831 time=135.45 INFO:root:[step 169749] mlm_loss=1.51854 mlm_acc=69.41441 nsp_loss=0.07469 nsp_acc=97.301 throughput=138.0K tks/s lr=0.0000830 time=140.10 INFO:root:[step 169999] mlm_loss=1.80031 mlm_acc=62.61490 nsp_loss=0.04824 nsp_acc=98.260 throughput=136.0K tks/s lr=0.0000830 time=117.86 INFO:root:[step 169999] Saving checkpoints to /home/ubuntu/ckpt-master/0169999.params, /home/ubuntu/ckpt-master/0169999.states. INFO:root:[step 170249] mlm_loss=1.93867 mlm_acc=61.68784 nsp_loss=0.04831 nsp_acc=98.213 throughput=124.0K tks/s lr=0.0000830 time=147.83 INFO:root:[step 170499] mlm_loss=1.85804 mlm_acc=62.26245 nsp_loss=0.04732 nsp_acc=98.251 throughput=128.0K tks/s lr=0.0000830 time=126.42 INFO:root:[step 170749] mlm_loss=1.81315 mlm_acc=62.85492 nsp_loss=0.04573 nsp_acc=98.312 throughput=134.0K tks/s lr=0.0000829 time=116.10 INFO:root:[step 170999] mlm_loss=1.89511 mlm_acc=62.25815 nsp_loss=0.04764 nsp_acc=98.228 throughput=135.0K tks/s lr=0.0000829 time=132.33 INFO:root:[step 171249] mlm_loss=1.70123 mlm_acc=63.94033 nsp_loss=0.05126 nsp_acc=98.097 throughput=126.0K tks/s lr=0.0000829 time=112.03 INFO:root:[step 171499] mlm_loss=2.05178 mlm_acc=58.39990 nsp_loss=0.10408 nsp_acc=95.747 throughput=127.0K tks/s lr=0.0000829 time=131.46 INFO:root:[step 171749] mlm_loss=1.84417 mlm_acc=62.28331 nsp_loss=0.04557 nsp_acc=98.254 throughput=132.0K tks/s lr=0.0000828 time=131.60 INFO:root:[step 171999] mlm_loss=1.99499 mlm_acc=58.83279 nsp_loss=0.07054 nsp_acc=97.208 throughput=149.0K tks/s lr=0.0000828 time=144.17 INFO:root:[step 172249] mlm_loss=1.96768 mlm_acc=59.69392 nsp_loss=0.10866 nsp_acc=95.508 throughput=142.0K tks/s lr=0.0000828 time=145.93 INFO:root:[step 172499] mlm_loss=1.80929 mlm_acc=61.34118 nsp_loss=0.07265 nsp_acc=97.188 throughput=144.0K tks/s lr=0.0000828 time=135.66 INFO:root:[step 172749] mlm_loss=2.00642 mlm_acc=60.96177 nsp_loss=0.04617 nsp_acc=98.247 throughput=145.0K tks/s lr=0.0000827 time=143.95 INFO:root:[step 172999] mlm_loss=1.89912 mlm_acc=61.95117 nsp_loss=0.04469 nsp_acc=98.329 throughput=134.0K tks/s lr=0.0000827 time=136.87 INFO:root:[step 173249] mlm_loss=1.70251 mlm_acc=63.71176 nsp_loss=0.04991 nsp_acc=98.199 throughput=123.0K tks/s lr=0.0000827 time=108.82 INFO:root:[step 173499] mlm_loss=1.72328 mlm_acc=63.46977 nsp_loss=0.05113 nsp_acc=98.178 throughput=118.0K tks/s lr=0.0000827 time=121.04 INFO:root:[step 173749] mlm_loss=2.00790 mlm_acc=60.60076 nsp_loss=0.05408 nsp_acc=97.919 throughput=151.0K tks/s lr=0.0000826 time=145.37 INFO:root:[step 173999] mlm_loss=1.79102 mlm_acc=61.82804 nsp_loss=0.06222 nsp_acc=97.635 throughput=135.0K tks/s lr=0.0000826 time=124.16 INFO:root:[step 174249] mlm_loss=2.06115 mlm_acc=59.25122 nsp_loss=0.07770 nsp_acc=96.883 throughput=146.0K tks/s lr=0.0000826 time=159.77 INFO:root:[step 174499] mlm_loss=1.84652 mlm_acc=61.41983 nsp_loss=0.07466 nsp_acc=97.120 throughput=139.0K tks/s lr=0.0000826 time=127.43 INFO:root:[step 174749] mlm_loss=1.90080 mlm_acc=60.21118 nsp_loss=0.07061 nsp_acc=97.230 throughput=138.0K tks/s lr=0.0000825 time=135.90 INFO:root:[step 174999] mlm_loss=1.98746 mlm_acc=59.91838 nsp_loss=0.06944 nsp_acc=97.234 throughput=151.0K tks/s lr=0.0000825 time=161.15 INFO:root:[step 174999] Saving checkpoints to /home/ubuntu/ckpt-master/0174999.params, /home/ubuntu/ckpt-master/0174999.states. INFO:root:[step 175249] mlm_loss=1.77424 mlm_acc=62.22624 nsp_loss=0.07178 nsp_acc=97.147 throughput=128.0K tks/s lr=0.0000825 time=145.93 INFO:root:[step 175499] mlm_loss=1.84966 mlm_acc=61.35735 nsp_loss=0.11587 nsp_acc=94.998 throughput=134.0K tks/s lr=0.0000825 time=135.08 INFO:root:[step 175749] mlm_loss=1.80762 mlm_acc=60.49437 nsp_loss=0.07656 nsp_acc=97.061 throughput=140.0K tks/s lr=0.0000824 time=139.61 INFO:root:[step 175999] mlm_loss=1.64855 mlm_acc=64.54223 nsp_loss=0.05771 nsp_acc=97.867 throughput=121.0K tks/s lr=0.0000824 time=108.46 INFO:root:[step 176249] mlm_loss=1.99520 mlm_acc=60.02688 nsp_loss=0.08515 nsp_acc=96.595 throughput=147.0K tks/s lr=0.0000824 time=156.59 INFO:root:[step 176499] mlm_loss=1.91035 mlm_acc=61.30942 nsp_loss=0.09005 nsp_acc=96.247 throughput=140.0K tks/s lr=0.0000824 time=141.82 INFO:root:[step 176749] mlm_loss=1.67975 mlm_acc=64.10304 nsp_loss=0.05005 nsp_acc=98.172 throughput=120.0K tks/s lr=0.0000823 time=107.95 INFO:root:[step 176999] mlm_loss=1.66492 mlm_acc=64.09709 nsp_loss=0.05248 nsp_acc=98.097 throughput=117.0K tks/s lr=0.0000823 time=107.92 INFO:root:[step 177249] mlm_loss=1.67949 mlm_acc=63.97361 nsp_loss=0.05561 nsp_acc=97.902 throughput=116.0K tks/s lr=0.0000823 time=105.90 INFO:root:[step 177499] mlm_loss=1.91240 mlm_acc=61.39809 nsp_loss=0.04461 nsp_acc=98.333 throughput=138.0K tks/s lr=0.0000823 time=135.19 INFO:root:[step 177749] mlm_loss=1.68197 mlm_acc=63.55393 nsp_loss=0.05402 nsp_acc=98.030 throughput=115.0K tks/s lr=0.0000822 time=120.77 INFO:root:[step 177999] mlm_loss=1.54204 mlm_acc=68.48539 nsp_loss=0.06613 nsp_acc=97.610 throughput=135.0K tks/s lr=0.0000822 time=114.67 INFO:root:[step 178249] mlm_loss=1.55371 mlm_acc=67.41897 nsp_loss=0.05526 nsp_acc=98.021 throughput=128.0K tks/s lr=0.0000822 time=124.49 INFO:root:[step 178499] mlm_loss=1.99028 mlm_acc=60.65759 nsp_loss=0.04720 nsp_acc=98.237 throughput=147.0K tks/s lr=0.0000822 time=145.79 INFO:root:[step 178749] mlm_loss=1.65311 mlm_acc=61.77214 nsp_loss=0.06743 nsp_acc=97.541 throughput=132.0K tks/s lr=0.0000821 time=123.07 INFO:root:[step 178999] mlm_loss=1.89423 mlm_acc=59.91829 nsp_loss=0.11457 nsp_acc=95.322 throughput=149.0K tks/s lr=0.0000821 time=168.67 INFO:root:[step 179249] mlm_loss=1.76617 mlm_acc=63.63485 nsp_loss=0.04966 nsp_acc=98.179 throughput=128.0K tks/s lr=0.0000821 time=115.32 INFO:root:[step 179499] mlm_loss=1.83934 mlm_acc=61.12228 nsp_loss=0.11930 nsp_acc=94.995 throughput=148.0K tks/s lr=0.0000821 time=148.57 INFO:root:[step 179749] mlm_loss=1.86374 mlm_acc=61.60222 nsp_loss=0.05337 nsp_acc=98.054 throughput=138.0K tks/s lr=0.0000820 time=135.91 INFO:root:[step 179999] mlm_loss=1.88616 mlm_acc=60.14007 nsp_loss=0.07065 nsp_acc=97.257 throughput=141.0K tks/s lr=0.0000820 time=138.98 INFO:root:[step 179999] Saving checkpoints to /home/ubuntu/ckpt-master/0179999.params, /home/ubuntu/ckpt-master/0179999.states. INFO:root:[step 180249] mlm_loss=1.66482 mlm_acc=64.03412 nsp_loss=0.04959 nsp_acc=98.238 throughput=106.0K tks/s lr=0.0000820 time=125.19 INFO:root:[step 180499] mlm_loss=1.79748 mlm_acc=62.92185 nsp_loss=0.04915 nsp_acc=98.167 throughput=123.0K tks/s lr=0.0000820 time=124.94 INFO:root:[step 180749] mlm_loss=1.87024 mlm_acc=60.87773 nsp_loss=0.09578 nsp_acc=96.139 throughput=149.0K tks/s lr=0.0000819 time=145.84 INFO:root:[step 180999] mlm_loss=1.95746 mlm_acc=60.99464 nsp_loss=0.05857 nsp_acc=97.785 throughput=146.0K tks/s lr=0.0000819 time=145.46 INFO:root:[step 181249] mlm_loss=1.82688 mlm_acc=62.87872 nsp_loss=0.04824 nsp_acc=98.263 throughput=127.0K tks/s lr=0.0000819 time=121.84 INFO:root:[step 181499] mlm_loss=1.87380 mlm_acc=62.28385 nsp_loss=0.04869 nsp_acc=98.238 throughput=136.0K tks/s lr=0.0000819 time=120.33 INFO:root:[step 181749] mlm_loss=1.71457 mlm_acc=63.67762 nsp_loss=0.05195 nsp_acc=98.138 throughput=114.0K tks/s lr=0.0000818 time=117.26 INFO:root:[step 181999] mlm_loss=1.71087 mlm_acc=63.07863 nsp_loss=0.09511 nsp_acc=96.125 throughput=127.0K tks/s lr=0.0000818 time=113.95 INFO:root:[step 182249] mlm_loss=1.89521 mlm_acc=61.58556 nsp_loss=0.10243 nsp_acc=95.663 throughput=133.0K tks/s lr=0.0000818 time=134.93 INFO:root:[step 182499] mlm_loss=1.69909 mlm_acc=63.87204 nsp_loss=0.05330 nsp_acc=98.099 throughput=119.0K tks/s lr=0.0000818 time=106.89 INFO:root:[step 182749] mlm_loss=1.69033 mlm_acc=63.55535 nsp_loss=0.05592 nsp_acc=97.941 throughput=122.0K tks/s lr=0.0000817 time=109.67 INFO:root:[step 182999] mlm_loss=1.88013 mlm_acc=61.93429 nsp_loss=0.04844 nsp_acc=98.174 throughput=134.0K tks/s lr=0.0000817 time=132.05 INFO:root:[step 183249] mlm_loss=1.74420 mlm_acc=63.39315 nsp_loss=0.05074 nsp_acc=98.101 throughput=118.0K tks/s lr=0.0000817 time=122.45 INFO:root:[step 183499] mlm_loss=1.76306 mlm_acc=61.79060 nsp_loss=0.07986 nsp_acc=96.794 throughput=141.0K tks/s lr=0.0000817 time=120.56 INFO:root:[step 183749] mlm_loss=1.76423 mlm_acc=62.79806 nsp_loss=0.05885 nsp_acc=97.791 throughput=124.0K tks/s lr=0.0000816 time=127.14 INFO:root:[step 183999] mlm_loss=1.82079 mlm_acc=62.74641 nsp_loss=0.05057 nsp_acc=98.149 throughput=138.0K tks/s lr=0.0000816 time=120.37 INFO:root:[step 184249] mlm_loss=1.98030 mlm_acc=60.94519 nsp_loss=0.04574 nsp_acc=98.367 throughput=140.0K tks/s lr=0.0000816 time=154.30 INFO:root:[step 184499] mlm_loss=1.74894 mlm_acc=62.16273 nsp_loss=0.07353 nsp_acc=97.153 throughput=146.0K tks/s lr=0.0000816 time=127.18 INFO:root:[step 184749] mlm_loss=1.82624 mlm_acc=62.07452 nsp_loss=0.05079 nsp_acc=98.134 throughput=130.0K tks/s lr=0.0000815 time=129.87 INFO:root:[step 184999] mlm_loss=1.98020 mlm_acc=58.89864 nsp_loss=0.09045 nsp_acc=96.417 throughput=151.0K tks/s lr=0.0000815 time=161.98 INFO:root:[step 184999] Saving checkpoints to /home/ubuntu/ckpt-master/0184999.params, /home/ubuntu/ckpt-master/0184999.states. INFO:root:[step 185249] mlm_loss=2.01929 mlm_acc=60.32760 nsp_loss=0.07366 nsp_acc=97.128 throughput=135.0K tks/s lr=0.0000815 time=148.98 INFO:root:[step 185499] mlm_loss=1.94729 mlm_acc=61.48193 nsp_loss=0.04509 nsp_acc=98.309 throughput=137.0K tks/s lr=0.0000815 time=149.36 INFO:root:[step 185749] mlm_loss=1.72013 mlm_acc=63.70889 nsp_loss=0.05141 nsp_acc=98.115 throughput=126.0K tks/s lr=0.0000814 time=110.33 INFO:root:[step 185999] mlm_loss=1.80186 mlm_acc=62.11504 nsp_loss=0.09511 nsp_acc=96.144 throughput=141.0K tks/s lr=0.0000814 time=140.60 INFO:root:[step 186249] mlm_loss=1.61916 mlm_acc=64.57493 nsp_loss=0.05255 nsp_acc=98.081 throughput=117.0K tks/s lr=0.0000814 time=108.80 INFO:root:[step 186499] mlm_loss=1.85098 mlm_acc=61.70806 nsp_loss=0.06243 nsp_acc=97.554 throughput=136.0K tks/s lr=0.0000814 time=128.52 INFO:root:[step 186749] mlm_loss=1.76290 mlm_acc=61.91798 nsp_loss=0.07040 nsp_acc=97.393 throughput=132.0K tks/s lr=0.0000813 time=122.29 INFO:root:[step 186999] mlm_loss=1.79376 mlm_acc=60.44220 nsp_loss=0.05901 nsp_acc=97.761 throughput=134.0K tks/s lr=0.0000813 time=136.65 INFO:root:[step 187249] mlm_loss=1.84839 mlm_acc=61.99981 nsp_loss=0.08951 nsp_acc=96.328 throughput=131.0K tks/s lr=0.0000813 time=128.57 INFO:root:[step 187499] mlm_loss=1.82488 mlm_acc=61.93086 nsp_loss=0.09229 nsp_acc=96.163 throughput=137.0K tks/s lr=0.0000813 time=122.18 INFO:root:[step 187749] mlm_loss=1.89178 mlm_acc=61.94359 nsp_loss=0.04575 nsp_acc=98.319 throughput=133.0K tks/s lr=0.0000812 time=133.88 INFO:root:[step 187999] mlm_loss=1.87281 mlm_acc=62.25552 nsp_loss=0.04614 nsp_acc=98.294 throughput=129.0K tks/s lr=0.0000812 time=130.18 INFO:root:[step 188249] mlm_loss=1.87164 mlm_acc=62.06210 nsp_loss=0.04335 nsp_acc=98.387 throughput=138.0K tks/s lr=0.0000812 time=132.06 INFO:root:[step 188499] mlm_loss=1.83494 mlm_acc=62.51635 nsp_loss=0.04920 nsp_acc=98.189 throughput=127.0K tks/s lr=0.0000812 time=129.40 INFO:root:[step 188749] mlm_loss=1.70181 mlm_acc=63.92922 nsp_loss=0.05121 nsp_acc=98.133 throughput=123.0K tks/s lr=0.0000811 time=109.73 INFO:root:[step 188999] mlm_loss=1.81203 mlm_acc=61.82182 nsp_loss=0.09282 nsp_acc=96.246 throughput=134.0K tks/s lr=0.0000811 time=132.80 INFO:root:[step 189249] mlm_loss=1.65722 mlm_acc=64.05405 nsp_loss=0.06003 nsp_acc=97.796 throughput=118.0K tks/s lr=0.0000811 time=109.44 INFO:root:[step 189499] mlm_loss=1.89155 mlm_acc=59.98207 nsp_loss=0.08787 nsp_acc=96.628 throughput=129.0K tks/s lr=0.0000811 time=116.63 INFO:root:[step 189749] mlm_loss=1.75774 mlm_acc=62.78908 nsp_loss=0.05811 nsp_acc=97.852 throughput=113.0K tks/s lr=0.0000810 time=119.60 INFO:root:[step 189999] mlm_loss=1.60565 mlm_acc=65.03336 nsp_loss=0.05439 nsp_acc=98.104 throughput=120.0K tks/s lr=0.0000810 time=110.70 INFO:root:[step 189999] Saving checkpoints to /home/ubuntu/ckpt-master/0189999.params, /home/ubuntu/ckpt-master/0189999.states. INFO:root:[step 190249] mlm_loss=1.63328 mlm_acc=64.55249 nsp_loss=0.05769 nsp_acc=97.887 throughput=106.0K tks/s lr=0.0000810 time=123.51 INFO:root:[step 190499] mlm_loss=1.93274 mlm_acc=61.27859 nsp_loss=0.09901 nsp_acc=96.035 throughput=137.0K tks/s lr=0.0000810 time=135.53 INFO:root:[step 190749] mlm_loss=1.98779 mlm_acc=59.89275 nsp_loss=0.10176 nsp_acc=95.948 throughput=150.0K tks/s lr=0.0000809 time=148.57 INFO:root:[step 190999] mlm_loss=1.66067 mlm_acc=63.75630 nsp_loss=0.05224 nsp_acc=98.073 throughput=112.0K tks/s lr=0.0000809 time=119.64 INFO:root:[step 191249] mlm_loss=1.63321 mlm_acc=64.36867 nsp_loss=0.05570 nsp_acc=97.913 throughput=116.0K tks/s lr=0.0000809 time=108.28 INFO:root:[step 191499] mlm_loss=1.81665 mlm_acc=60.78613 nsp_loss=0.08163 nsp_acc=96.774 throughput=133.0K tks/s lr=0.0000809 time=132.20 INFO:root:[step 191749] mlm_loss=1.70085 mlm_acc=64.03757 nsp_loss=0.04857 nsp_acc=98.193 throughput=125.0K tks/s lr=0.0000808 time=116.57 INFO:root:[step 191999] mlm_loss=1.80481 mlm_acc=62.15794 nsp_loss=0.04699 nsp_acc=98.300 throughput=131.0K tks/s lr=0.0000808 time=129.19 INFO:root:[step 192249] mlm_loss=1.84652 mlm_acc=62.38583 nsp_loss=0.04683 nsp_acc=98.272 throughput=134.0K tks/s lr=0.0000808 time=128.88 INFO:root:[step 192499] mlm_loss=1.68426 mlm_acc=63.84221 nsp_loss=0.05275 nsp_acc=98.119 throughput=121.0K tks/s lr=0.0000808 time=111.80 INFO:root:[step 192749] mlm_loss=1.73980 mlm_acc=62.19105 nsp_loss=0.06602 nsp_acc=97.509 throughput=137.0K tks/s lr=0.0000807 time=132.80 INFO:root:[step 192999] mlm_loss=1.87212 mlm_acc=62.56369 nsp_loss=0.04736 nsp_acc=98.237 throughput=132.0K tks/s lr=0.0000807 time=127.15 INFO:root:[step 193249] mlm_loss=2.00478 mlm_acc=59.56770 nsp_loss=0.06075 nsp_acc=97.698 throughput=147.0K tks/s lr=0.0000807 time=152.45 INFO:root:[step 193499] mlm_loss=1.67711 mlm_acc=64.09404 nsp_loss=0.05179 nsp_acc=98.113 throughput=122.0K tks/s lr=0.0000807 time=108.97 INFO:root:[step 193749] mlm_loss=1.76056 mlm_acc=63.21691 nsp_loss=0.04990 nsp_acc=98.212 throughput=123.0K tks/s lr=0.0000806 time=126.08 INFO:root:[step 193999] mlm_loss=1.47212 mlm_acc=65.80848 nsp_loss=0.06408 nsp_acc=97.657 throughput=112.0K tks/s lr=0.0000806 time=104.52 INFO:root:[step 194249] mlm_loss=1.66911 mlm_acc=64.00073 nsp_loss=0.05308 nsp_acc=98.073 throughput=125.0K tks/s lr=0.0000806 time=110.23 INFO:root:[step 194499] mlm_loss=1.89424 mlm_acc=60.66032 nsp_loss=0.06256 nsp_acc=97.591 throughput=145.0K tks/s lr=0.0000806 time=141.45 INFO:root:[step 194749] mlm_loss=1.85491 mlm_acc=62.75748 nsp_loss=0.05041 nsp_acc=98.174 throughput=128.0K tks/s lr=0.0000805 time=127.32 INFO:root:[step 194999] mlm_loss=1.91440 mlm_acc=61.44773 nsp_loss=0.08104 nsp_acc=96.787 throughput=151.0K tks/s lr=0.0000805 time=147.84 INFO:root:[step 194999] Saving checkpoints to /home/ubuntu/ckpt-master/0194999.params, /home/ubuntu/ckpt-master/0194999.states. INFO:root:[step 195249] mlm_loss=1.89239 mlm_acc=62.15460 nsp_loss=0.04843 nsp_acc=98.222 throughput=128.0K tks/s lr=0.0000805 time=155.38 INFO:root:[step 195499] mlm_loss=1.78752 mlm_acc=61.71436 nsp_loss=0.07905 nsp_acc=96.893 throughput=138.0K tks/s lr=0.0000805 time=138.09 INFO:root:[step 195749] mlm_loss=1.70174 mlm_acc=63.79075 nsp_loss=0.05109 nsp_acc=98.154 throughput=127.0K tks/s lr=0.0000804 time=113.24 INFO:root:[step 195999] mlm_loss=1.81963 mlm_acc=62.12752 nsp_loss=0.05609 nsp_acc=97.794 throughput=132.0K tks/s lr=0.0000804 time=129.24 INFO:root:[step 196249] mlm_loss=2.03705 mlm_acc=59.37255 nsp_loss=0.07589 nsp_acc=97.067 throughput=155.0K tks/s lr=0.0000804 time=156.12 INFO:root:[step 196499] mlm_loss=1.75507 mlm_acc=62.49489 nsp_loss=0.05618 nsp_acc=97.917 throughput=127.0K tks/s lr=0.0000804 time=123.99 INFO:root:[step 196749] mlm_loss=1.88569 mlm_acc=61.66193 nsp_loss=0.05268 nsp_acc=97.995 throughput=138.0K tks/s lr=0.0000803 time=139.35 INFO:root:[step 196999] mlm_loss=1.70633 mlm_acc=66.20669 nsp_loss=0.06340 nsp_acc=97.631 throughput=145.0K tks/s lr=0.0000803 time=139.72 INFO:root:[step 197249] mlm_loss=1.86162 mlm_acc=62.52723 nsp_loss=0.05114 nsp_acc=98.080 throughput=135.0K tks/s lr=0.0000803 time=131.02 INFO:root:[step 197499] mlm_loss=1.86719 mlm_acc=61.91100 nsp_loss=0.04592 nsp_acc=98.238 throughput=139.0K tks/s lr=0.0000803 time=140.99 INFO:root:[step 197749] mlm_loss=1.74909 mlm_acc=63.19753 nsp_loss=0.04870 nsp_acc=98.254 throughput=134.0K tks/s lr=0.0000802 time=115.41 INFO:root:[step 197999] mlm_loss=1.78953 mlm_acc=63.25141 nsp_loss=0.04589 nsp_acc=98.309 throughput=123.0K tks/s lr=0.0000802 time=126.21 INFO:root:[step 198249] mlm_loss=1.94621 mlm_acc=60.46303 nsp_loss=0.09606 nsp_acc=96.091 throughput=151.0K tks/s lr=0.0000802 time=148.76 INFO:root:[step 198499] mlm_loss=1.88440 mlm_acc=60.93792 nsp_loss=0.07785 nsp_acc=96.857 throughput=136.0K tks/s lr=0.0000802 time=129.92 INFO:root:[step 198749] mlm_loss=2.04935 mlm_acc=58.92132 nsp_loss=0.09561 nsp_acc=95.985 throughput=158.0K tks/s lr=0.0000801 time=164.41 INFO:root:[step 198999] mlm_loss=1.90254 mlm_acc=61.07527 nsp_loss=0.06306 nsp_acc=97.535 throughput=142.0K tks/s lr=0.0000801 time=139.93 INFO:root:[step 199249] mlm_loss=1.82504 mlm_acc=61.79693 nsp_loss=0.05596 nsp_acc=97.913 throughput=134.0K tks/s lr=0.0000801 time=137.72 INFO:root:[step 199499] mlm_loss=1.92335 mlm_acc=60.28315 nsp_loss=0.08224 nsp_acc=96.717 throughput=133.0K tks/s lr=0.0000801 time=132.36 INFO:root:[step 199749] mlm_loss=1.83997 mlm_acc=62.77791 nsp_loss=0.04804 nsp_acc=98.201 throughput=136.0K tks/s lr=0.0000800 time=119.73 INFO:root:[step 199999] mlm_loss=1.74943 mlm_acc=61.74171 nsp_loss=0.08778 nsp_acc=96.597 throughput=135.0K tks/s lr=0.0000800 time=136.23 INFO:root:[step 199999] Saving checkpoints to /home/ubuntu/ckpt-master/0199999.params, /home/ubuntu/ckpt-master/0199999.states. INFO:root:[step 200249] mlm_loss=1.67438 mlm_acc=64.35402 nsp_loss=0.05340 nsp_acc=98.039 throughput=103.0K tks/s lr=0.0000800 time=121.08 INFO:root:[step 200499] mlm_loss=1.79950 mlm_acc=62.45296 nsp_loss=0.04956 nsp_acc=98.228 throughput=131.0K tks/s lr=0.0000800 time=128.12 INFO:root:[step 200749] mlm_loss=1.79561 mlm_acc=61.41879 nsp_loss=0.08206 nsp_acc=96.750 throughput=137.0K tks/s lr=0.0000799 time=134.65 INFO:root:[step 200999] mlm_loss=1.77447 mlm_acc=62.83590 nsp_loss=0.05092 nsp_acc=98.112 throughput=134.0K tks/s lr=0.0000799 time=123.50 INFO:root:[step 201249] mlm_loss=1.89962 mlm_acc=61.17239 nsp_loss=0.07403 nsp_acc=97.088 throughput=146.0K tks/s lr=0.0000799 time=152.47 INFO:root:[step 201499] mlm_loss=1.78677 mlm_acc=62.97277 nsp_loss=0.05106 nsp_acc=98.109 throughput=136.0K tks/s lr=0.0000799 time=117.20 INFO:root:[step 201749] mlm_loss=1.79499 mlm_acc=62.14257 nsp_loss=0.08498 nsp_acc=96.504 throughput=131.0K tks/s lr=0.0000798 time=128.54 INFO:root:[step 201999] mlm_loss=1.88475 mlm_acc=61.88596 nsp_loss=0.07022 nsp_acc=97.212 throughput=137.0K tks/s lr=0.0000798 time=134.88 INFO:root:[step 202249] mlm_loss=2.02438 mlm_acc=58.95341 nsp_loss=0.08246 nsp_acc=96.759 throughput=153.0K tks/s lr=0.0000798 time=152.71 INFO:root:[step 202499] mlm_loss=2.00339 mlm_acc=59.42746 nsp_loss=0.10410 nsp_acc=95.679 throughput=155.0K tks/s lr=0.0000798 time=173.35 INFO:root:[step 202749] mlm_loss=2.10894 mlm_acc=58.75363 nsp_loss=0.09051 nsp_acc=96.455 throughput=153.0K tks/s lr=0.0000797 time=152.04 INFO:root:[step 202999] mlm_loss=1.75729 mlm_acc=62.21288 nsp_loss=0.06654 nsp_acc=97.497 throughput=124.0K tks/s lr=0.0000797 time=128.15 INFO:root:[step 203249] mlm_loss=1.77964 mlm_acc=63.61649 nsp_loss=0.04589 nsp_acc=98.363 throughput=132.0K tks/s lr=0.0000797 time=117.81 INFO:root:[step 203499] mlm_loss=1.84884 mlm_acc=62.37096 nsp_loss=0.06977 nsp_acc=97.265 throughput=136.0K tks/s lr=0.0000797 time=130.57 INFO:root:[step 203749] mlm_loss=1.83284 mlm_acc=61.74331 nsp_loss=0.11878 nsp_acc=94.927 throughput=151.0K tks/s lr=0.0000796 time=155.32 INFO:root:[step 203999] mlm_loss=1.82771 mlm_acc=61.73387 nsp_loss=0.07799 nsp_acc=96.947 throughput=139.0K tks/s lr=0.0000796 time=139.19 INFO:root:[step 204249] mlm_loss=1.69439 mlm_acc=63.58166 nsp_loss=0.05160 nsp_acc=98.083 throughput=131.0K tks/s lr=0.0000796 time=111.54 INFO:root:[step 204499] mlm_loss=2.04603 mlm_acc=59.26939 nsp_loss=0.11001 nsp_acc=95.591 throughput=147.0K tks/s lr=0.0000796 time=146.16 INFO:root:[step 204749] mlm_loss=1.73519 mlm_acc=62.77988 nsp_loss=0.05671 nsp_acc=97.899 throughput=124.0K tks/s lr=0.0000795 time=123.24 INFO:root:[step 204999] mlm_loss=1.75608 mlm_acc=63.11689 nsp_loss=0.04975 nsp_acc=98.209 throughput=130.0K tks/s lr=0.0000795 time=117.25 INFO:root:[step 204999] Saving checkpoints to /home/ubuntu/ckpt-master/0204999.params, /home/ubuntu/ckpt-master/0204999.states. INFO:root:[step 205249] mlm_loss=2.04602 mlm_acc=58.94917 nsp_loss=0.09471 nsp_acc=96.183 throughput=112.0K tks/s lr=0.0000795 time=142.31 INFO:root:[step 205499] mlm_loss=1.70095 mlm_acc=64.16612 nsp_loss=0.05309 nsp_acc=98.057 throughput=124.0K tks/s lr=0.0000795 time=108.95 INFO:root:[step 205749] mlm_loss=1.71128 mlm_acc=63.68796 nsp_loss=0.07949 nsp_acc=96.807 throughput=122.0K tks/s lr=0.0000794 time=122.61 INFO:root:[step 205999] mlm_loss=1.83478 mlm_acc=62.47753 nsp_loss=0.09318 nsp_acc=96.142 throughput=138.0K tks/s lr=0.0000794 time=122.64 INFO:root:[step 206249] mlm_loss=1.43237 mlm_acc=66.04402 nsp_loss=0.06496 nsp_acc=97.682 throughput=99.0K tks/s lr=0.0000794 time=107.43 INFO:root:[step 206499] mlm_loss=1.74311 mlm_acc=61.99989 nsp_loss=0.08887 nsp_acc=96.436 throughput=145.0K tks/s lr=0.0000794 time=133.33 INFO:root:[step 206749] mlm_loss=1.83196 mlm_acc=62.75112 nsp_loss=0.04938 nsp_acc=98.169 throughput=129.0K tks/s lr=0.0000793 time=126.55 INFO:root:[step 206999] mlm_loss=1.83438 mlm_acc=62.60528 nsp_loss=0.05461 nsp_acc=97.960 throughput=136.0K tks/s lr=0.0000793 time=129.48 INFO:root:[step 207249] mlm_loss=1.86860 mlm_acc=61.17612 nsp_loss=0.06922 nsp_acc=97.404 throughput=141.0K tks/s lr=0.0000793 time=138.93 INFO:root:[step 207499] mlm_loss=2.03577 mlm_acc=59.15242 nsp_loss=0.08563 nsp_acc=96.600 throughput=155.0K tks/s lr=0.0000793 time=160.13 INFO:root:[step 207749] mlm_loss=1.91853 mlm_acc=61.30890 nsp_loss=0.09068 nsp_acc=96.319 throughput=150.0K tks/s lr=0.0000792 time=147.79 INFO:root:[step 207999] mlm_loss=1.89945 mlm_acc=62.33293 nsp_loss=0.04776 nsp_acc=98.235 throughput=137.0K tks/s lr=0.0000792 time=133.22 INFO:root:[step 208249] mlm_loss=1.79966 mlm_acc=63.27618 nsp_loss=0.04944 nsp_acc=98.186 throughput=132.0K tks/s lr=0.0000792 time=127.32 INFO:root:[step 208499] mlm_loss=1.76487 mlm_acc=62.83256 nsp_loss=0.05084 nsp_acc=98.103 throughput=131.0K tks/s lr=0.0000792 time=120.08 INFO:root:[step 208749] mlm_loss=1.62981 mlm_acc=64.52389 nsp_loss=0.05791 nsp_acc=97.903 throughput=113.0K tks/s lr=0.0000791 time=117.23 INFO:root:[step 208999] mlm_loss=1.74345 mlm_acc=63.56334 nsp_loss=0.04992 nsp_acc=98.178 throughput=130.0K tks/s lr=0.0000791 time=115.74 INFO:root:[step 209249] mlm_loss=1.70341 mlm_acc=64.09374 nsp_loss=0.04739 nsp_acc=98.265 throughput=118.0K tks/s lr=0.0000791 time=116.13 INFO:root:[step 209499] mlm_loss=1.87050 mlm_acc=62.41099 nsp_loss=0.04431 nsp_acc=98.340 throughput=142.0K tks/s lr=0.0000791 time=136.97 INFO:root:[step 209749] mlm_loss=1.85869 mlm_acc=62.72659 nsp_loss=0.04551 nsp_acc=98.333 throughput=142.0K tks/s lr=0.0000790 time=121.84 INFO:root:[step 209999] mlm_loss=1.73303 mlm_acc=63.62062 nsp_loss=0.04966 nsp_acc=98.239 throughput=125.0K tks/s lr=0.0000790 time=120.73 INFO:root:[step 209999] Saving checkpoints to /home/ubuntu/ckpt-master/0209999.params, /home/ubuntu/ckpt-master/0209999.states. INFO:root:[step 210249] mlm_loss=1.82840 mlm_acc=62.66695 nsp_loss=0.04791 nsp_acc=98.238 throughput=122.0K tks/s lr=0.0000790 time=136.65 INFO:root:[step 210499] mlm_loss=1.86111 mlm_acc=60.35280 nsp_loss=0.06797 nsp_acc=97.361 throughput=140.0K tks/s lr=0.0000790 time=137.48 INFO:root:[step 210749] mlm_loss=1.80874 mlm_acc=63.14278 nsp_loss=0.04756 nsp_acc=98.214 throughput=128.0K tks/s lr=0.0000789 time=122.71 INFO:root:[step 210999] mlm_loss=1.92150 mlm_acc=61.14998 nsp_loss=0.07770 nsp_acc=96.974 throughput=156.0K tks/s lr=0.0000789 time=156.06 INFO:root:[step 211249] mlm_loss=1.88433 mlm_acc=62.46250 nsp_loss=0.05191 nsp_acc=98.039 throughput=138.0K tks/s lr=0.0000789 time=134.26 INFO:root:[step 211499] mlm_loss=2.05257 mlm_acc=58.57007 nsp_loss=0.07071 nsp_acc=97.299 throughput=148.0K tks/s lr=0.0000789 time=171.31 INFO:root:[step 211749] mlm_loss=1.81186 mlm_acc=61.30599 nsp_loss=0.07296 nsp_acc=97.127 throughput=139.0K tks/s lr=0.0000788 time=119.02 INFO:root:[step 211999] mlm_loss=1.80926 mlm_acc=62.93599 nsp_loss=0.05657 nsp_acc=97.787 throughput=128.0K tks/s lr=0.0000788 time=124.70 INFO:root:[step 212249] mlm_loss=1.86575 mlm_acc=61.15497 nsp_loss=0.08253 nsp_acc=96.777 throughput=141.0K tks/s lr=0.0000788 time=141.42 INFO:root:[step 212499] mlm_loss=1.83213 mlm_acc=62.42103 nsp_loss=0.04853 nsp_acc=98.207 throughput=135.0K tks/s lr=0.0000788 time=129.37 INFO:root:[step 212749] mlm_loss=1.88368 mlm_acc=62.25243 nsp_loss=0.04301 nsp_acc=98.416 throughput=141.0K tks/s lr=0.0000787 time=140.67 INFO:root:[step 212999] mlm_loss=1.72051 mlm_acc=63.54327 nsp_loss=0.04798 nsp_acc=98.225 throughput=133.0K tks/s lr=0.0000787 time=115.50 INFO:root:[step 213249] mlm_loss=2.02759 mlm_acc=59.43241 nsp_loss=0.09359 nsp_acc=96.124 throughput=153.0K tks/s lr=0.0000787 time=171.28 INFO:root:[step 213499] mlm_loss=1.88400 mlm_acc=61.70690 nsp_loss=0.10754 nsp_acc=95.580 throughput=151.0K tks/s lr=0.0000787 time=149.04 INFO:root:[step 213749] mlm_loss=1.87227 mlm_acc=60.80917 nsp_loss=0.09966 nsp_acc=95.961 throughput=150.0K tks/s lr=0.0000786 time=151.26 INFO:root:[step 213999] mlm_loss=1.87673 mlm_acc=62.47873 nsp_loss=0.04644 nsp_acc=98.282 throughput=140.0K tks/s lr=0.0000786 time=132.89 INFO:root:[step 214249] mlm_loss=1.79734 mlm_acc=63.34858 nsp_loss=0.04762 nsp_acc=98.248 throughput=128.0K tks/s lr=0.0000786 time=123.55 INFO:root:[step 214499] mlm_loss=1.82668 mlm_acc=62.31742 nsp_loss=0.04863 nsp_acc=98.176 throughput=140.0K tks/s lr=0.0000786 time=124.11 INFO:root:[step 214749] mlm_loss=1.95703 mlm_acc=59.75421 nsp_loss=0.12498 nsp_acc=94.903 throughput=145.0K tks/s lr=0.0000785 time=163.38 INFO:root:[step 214999] mlm_loss=1.67571 mlm_acc=64.22068 nsp_loss=0.05099 nsp_acc=98.091 throughput=122.0K tks/s lr=0.0000785 time=110.31 INFO:root:[step 214999] Saving checkpoints to /home/ubuntu/ckpt-master/0214999.params, /home/ubuntu/ckpt-master/0214999.states. INFO:root:[step 215249] mlm_loss=1.85827 mlm_acc=62.34575 nsp_loss=0.04609 nsp_acc=98.297 throughput=126.0K tks/s lr=0.0000785 time=146.51 INFO:root:[step 215499] mlm_loss=1.71426 mlm_acc=63.60533 nsp_loss=0.04875 nsp_acc=98.199 throughput=131.0K tks/s lr=0.0000785 time=113.84 INFO:root:[step 215749] mlm_loss=1.78859 mlm_acc=62.62621 nsp_loss=0.04885 nsp_acc=98.193 throughput=132.0K tks/s lr=0.0000784 time=130.71 INFO:root:[step 215999] mlm_loss=1.78389 mlm_acc=63.37519 nsp_loss=0.04783 nsp_acc=98.244 throughput=124.0K tks/s lr=0.0000784 time=125.44 INFO:root:[step 216249] mlm_loss=1.75912 mlm_acc=62.30833 nsp_loss=0.07955 nsp_acc=96.880 throughput=138.0K tks/s lr=0.0000784 time=134.92 INFO:root:[step 216499] mlm_loss=1.70066 mlm_acc=63.96608 nsp_loss=0.05202 nsp_acc=98.077 throughput=130.0K tks/s lr=0.0000784 time=111.89 INFO:root:[step 216749] mlm_loss=1.95203 mlm_acc=60.65728 nsp_loss=0.10762 nsp_acc=95.509 throughput=144.0K tks/s lr=0.0000783 time=145.07 INFO:root:[step 216999] mlm_loss=1.51927 mlm_acc=65.05175 nsp_loss=0.05538 nsp_acc=98.045 throughput=113.0K tks/s lr=0.0000783 time=108.67 INFO:root:[step 217249] mlm_loss=1.81765 mlm_acc=62.67935 nsp_loss=0.04709 nsp_acc=98.291 throughput=139.0K tks/s lr=0.0000783 time=133.60 INFO:root:[step 217499] mlm_loss=1.84977 mlm_acc=63.01809 nsp_loss=0.04420 nsp_acc=98.347 throughput=136.0K tks/s lr=0.0000783 time=129.99 INFO:root:[step 217749] mlm_loss=1.77747 mlm_acc=63.57341 nsp_loss=0.05080 nsp_acc=98.168 throughput=125.0K tks/s lr=0.0000782 time=130.42 INFO:root:[step 217999] mlm_loss=1.64987 mlm_acc=63.74819 nsp_loss=0.08591 nsp_acc=96.444 throughput=128.0K tks/s lr=0.0000782 time=111.08 INFO:root:[step 218249] mlm_loss=1.80883 mlm_acc=62.44493 nsp_loss=0.08488 nsp_acc=96.509 throughput=133.0K tks/s lr=0.0000782 time=133.53 INFO:root:[step 218499] mlm_loss=1.83390 mlm_acc=61.25975 nsp_loss=0.08983 nsp_acc=96.436 throughput=149.0K tks/s lr=0.0000782 time=129.51 INFO:root:[step 218749] mlm_loss=1.65526 mlm_acc=64.52713 nsp_loss=0.04978 nsp_acc=98.212 throughput=116.0K tks/s lr=0.0000781 time=118.98 INFO:root:[step 218999] mlm_loss=1.87888 mlm_acc=61.48412 nsp_loss=0.07494 nsp_acc=97.099 throughput=150.0K tks/s lr=0.0000781 time=149.02 INFO:root:[step 219249] mlm_loss=1.70347 mlm_acc=64.29933 nsp_loss=0.05000 nsp_acc=98.195 throughput=125.0K tks/s lr=0.0000781 time=127.19 INFO:root:[step 219499] mlm_loss=1.79089 mlm_acc=62.73329 nsp_loss=0.05036 nsp_acc=98.194 throughput=141.0K tks/s lr=0.0000781 time=120.14 INFO:root:[step 219749] mlm_loss=1.83243 mlm_acc=62.73444 nsp_loss=0.04601 nsp_acc=98.304 throughput=134.0K tks/s lr=0.0000780 time=131.76 INFO:root:[step 219999] mlm_loss=1.63491 mlm_acc=64.88929 nsp_loss=0.05198 nsp_acc=98.148 throughput=120.0K tks/s lr=0.0000780 time=107.54 INFO:root:[step 219999] Saving checkpoints to /home/ubuntu/ckpt-master/0219999.params, /home/ubuntu/ckpt-master/0219999.states. INFO:root:[step 220249] mlm_loss=1.60312 mlm_acc=64.91907 nsp_loss=0.05414 nsp_acc=98.036 throughput=94.0K tks/s lr=0.0000780 time=130.31 INFO:root:[step 220499] mlm_loss=1.70374 mlm_acc=63.15560 nsp_loss=0.09738 nsp_acc=95.953 throughput=134.0K tks/s lr=0.0000780 time=117.05 INFO:root:[step 220749] mlm_loss=1.66944 mlm_acc=64.06680 nsp_loss=0.05904 nsp_acc=97.824 throughput=122.0K tks/s lr=0.0000779 time=124.28 INFO:root:[step 220999] mlm_loss=1.75794 mlm_acc=64.06168 nsp_loss=0.05026 nsp_acc=98.117 throughput=131.0K tks/s lr=0.0000779 time=114.09 INFO:root:[step 221249] mlm_loss=1.87577 mlm_acc=62.69493 nsp_loss=0.04535 nsp_acc=98.322 throughput=136.0K tks/s lr=0.0000779 time=138.68 INFO:root:[step 221499] mlm_loss=1.64722 mlm_acc=64.55170 nsp_loss=0.05431 nsp_acc=98.064 throughput=123.0K tks/s lr=0.0000779 time=113.09 INFO:root:[step 221749] mlm_loss=1.78118 mlm_acc=63.74283 nsp_loss=0.04771 nsp_acc=98.278 throughput=125.0K tks/s lr=0.0000778 time=126.87 INFO:root:[step 221999] mlm_loss=1.67573 mlm_acc=64.14211 nsp_loss=0.05219 nsp_acc=98.165 throughput=120.0K tks/s lr=0.0000778 time=119.23 INFO:root:[step 222249] mlm_loss=1.83975 mlm_acc=63.33471 nsp_loss=0.04781 nsp_acc=98.256 throughput=141.0K tks/s lr=0.0000778 time=144.47 INFO:root:[step 222499] mlm_loss=1.68244 mlm_acc=64.51828 nsp_loss=0.04992 nsp_acc=98.152 throughput=126.0K tks/s lr=0.0000778 time=111.51 INFO:root:[step 222749] mlm_loss=1.96807 mlm_acc=60.43824 nsp_loss=0.08245 nsp_acc=96.790 throughput=141.0K tks/s lr=0.0000777 time=139.88 INFO:root:[step 222999] mlm_loss=1.89143 mlm_acc=62.66877 nsp_loss=0.04771 nsp_acc=98.206 throughput=138.0K tks/s lr=0.0000777 time=134.06 INFO:root:[step 223249] mlm_loss=1.75365 mlm_acc=63.55397 nsp_loss=0.04729 nsp_acc=98.232 throughput=134.0K tks/s lr=0.0000777 time=117.16 INFO:root:[step 223499] mlm_loss=1.57382 mlm_acc=65.20362 nsp_loss=0.05223 nsp_acc=98.135 throughput=107.0K tks/s lr=0.0000777 time=116.29 INFO:root:[step 223749] mlm_loss=1.69238 mlm_acc=64.28618 nsp_loss=0.05204 nsp_acc=98.063 throughput=122.0K tks/s lr=0.0000776 time=106.80 INFO:root:[step 223999] mlm_loss=1.68480 mlm_acc=63.20926 nsp_loss=0.07818 nsp_acc=96.915 throughput=139.0K tks/s lr=0.0000776 time=140.30 INFO:root:[step 224249] mlm_loss=1.62614 mlm_acc=65.01961 nsp_loss=0.05257 nsp_acc=98.078 throughput=121.0K tks/s lr=0.0000776 time=108.13 INFO:root:[step 224499] mlm_loss=1.61081 mlm_acc=64.90878 nsp_loss=0.05070 nsp_acc=98.246 throughput=111.0K tks/s lr=0.0000776 time=117.43 INFO:root:[step 224749] mlm_loss=1.58032 mlm_acc=64.21897 nsp_loss=0.09372 nsp_acc=96.141 throughput=121.0K tks/s lr=0.0000775 time=105.88 INFO:root:[step 224999] mlm_loss=1.89711 mlm_acc=61.65264 nsp_loss=0.10419 nsp_acc=95.654 throughput=140.0K tks/s lr=0.0000775 time=133.09 INFO:root:[step 224999] Saving checkpoints to /home/ubuntu/ckpt-master/0224999.params, /home/ubuntu/ckpt-master/0224999.states. INFO:root:[step 225249] mlm_loss=1.74778 mlm_acc=60.96141 nsp_loss=0.07386 nsp_acc=97.180 throughput=119.0K tks/s lr=0.0000775 time=143.19 INFO:root:[step 225499] mlm_loss=1.78821 mlm_acc=63.15516 nsp_loss=0.05153 nsp_acc=98.073 throughput=128.0K tks/s lr=0.0000775 time=127.19 INFO:root:[step 225749] mlm_loss=1.73358 mlm_acc=64.83478 nsp_loss=0.05752 nsp_acc=97.797 throughput=134.0K tks/s lr=0.0000774 time=129.57 INFO:root:[step 225999] mlm_loss=1.43456 mlm_acc=70.85363 nsp_loss=0.07693 nsp_acc=97.214 throughput=137.0K tks/s lr=0.0000774 time=124.86 INFO:root:[step 226249] mlm_loss=1.67311 mlm_acc=64.43896 nsp_loss=0.04921 nsp_acc=98.218 throughput=117.0K tks/s lr=0.0000774 time=116.29 INFO:root:[step 226499] mlm_loss=1.87683 mlm_acc=61.47811 nsp_loss=0.11985 nsp_acc=94.764 throughput=142.0K tks/s lr=0.0000774 time=142.03 INFO:root:[step 226749] mlm_loss=1.84075 mlm_acc=61.61278 nsp_loss=0.07431 nsp_acc=97.099 throughput=136.0K tks/s lr=0.0000773 time=117.72 INFO:root:[step 226999] mlm_loss=1.59659 mlm_acc=66.29460 nsp_loss=0.09219 nsp_acc=96.531 throughput=156.0K tks/s lr=0.0000773 time=155.77 INFO:root:[step 227249] mlm_loss=1.61031 mlm_acc=64.80872 nsp_loss=0.05941 nsp_acc=97.788 throughput=116.0K tks/s lr=0.0000773 time=118.09 INFO:root:[step 227499] mlm_loss=1.79506 mlm_acc=61.69024 nsp_loss=0.06022 nsp_acc=97.733 throughput=130.0K tks/s lr=0.0000773 time=136.97 INFO:root:[step 227749] mlm_loss=1.66109 mlm_acc=64.73814 nsp_loss=0.04976 nsp_acc=98.251 throughput=121.0K tks/s lr=0.0000772 time=106.98 INFO:root:[step 227999] mlm_loss=1.68854 mlm_acc=64.27791 nsp_loss=0.04851 nsp_acc=98.275 throughput=125.0K tks/s lr=0.0000772 time=111.68 INFO:root:[step 228249] mlm_loss=1.91286 mlm_acc=60.75880 nsp_loss=0.06039 nsp_acc=97.729 throughput=148.0K tks/s lr=0.0000772 time=145.55 INFO:root:[step 228499] mlm_loss=1.73653 mlm_acc=62.62502 nsp_loss=0.05315 nsp_acc=98.050 throughput=133.0K tks/s lr=0.0000772 time=128.60 INFO:root:[step 228749] mlm_loss=1.89397 mlm_acc=61.41044 nsp_loss=0.09672 nsp_acc=95.999 throughput=153.0K tks/s lr=0.0000771 time=154.01 INFO:root:[step 228999] mlm_loss=1.83792 mlm_acc=62.67722 nsp_loss=0.04543 nsp_acc=98.314 throughput=132.0K tks/s lr=0.0000771 time=128.10 INFO:root:[step 229249] mlm_loss=1.83211 mlm_acc=62.72050 nsp_loss=0.05796 nsp_acc=97.834 throughput=123.0K tks/s lr=0.0000771 time=125.35 INFO:root:[step 229499] mlm_loss=2.21294 mlm_acc=57.02952 nsp_loss=0.12218 nsp_acc=95.013 throughput=147.0K tks/s lr=0.0000771 time=132.53 INFO:root:[step 229749] mlm_loss=1.92630 mlm_acc=61.63685 nsp_loss=0.05045 nsp_acc=98.123 throughput=144.0K tks/s lr=0.0000770 time=149.67 INFO:root:[step 229999] mlm_loss=1.70165 mlm_acc=63.12797 nsp_loss=0.06553 nsp_acc=97.452 throughput=140.0K tks/s lr=0.0000770 time=128.05 INFO:root:[step 229999] Saving checkpoints to /home/ubuntu/ckpt-master/0229999.params, /home/ubuntu/ckpt-master/0229999.states. INFO:root:[step 230249] mlm_loss=1.67831 mlm_acc=64.49993 nsp_loss=0.04664 nsp_acc=98.263 throughput=104.0K tks/s lr=0.0000770 time=135.23 INFO:root:[step 230499] mlm_loss=1.86386 mlm_acc=61.03306 nsp_loss=0.07964 nsp_acc=96.842 throughput=140.0K tks/s lr=0.0000770 time=122.78 INFO:root:[step 230749] mlm_loss=1.74041 mlm_acc=63.27314 nsp_loss=0.03476 nsp_acc=98.755 throughput=133.0K tks/s lr=0.0000769 time=128.13 INFO:root:[step 230999] mlm_loss=1.79036 mlm_acc=63.28776 nsp_loss=0.03037 nsp_acc=98.932 throughput=138.0K tks/s lr=0.0000769 time=131.62 INFO:root:[step 231249] mlm_loss=1.84076 mlm_acc=61.69858 nsp_loss=0.14235 nsp_acc=93.916 throughput=146.0K tks/s lr=0.0000769 time=143.50 INFO:root:[step 231499] mlm_loss=1.81662 mlm_acc=62.72136 nsp_loss=0.05016 nsp_acc=98.125 throughput=137.0K tks/s lr=0.0000769 time=138.60 INFO:root:[step 231749] mlm_loss=1.80323 mlm_acc=62.39318 nsp_loss=0.08877 nsp_acc=96.411 throughput=134.0K tks/s lr=0.0000768 time=137.82 INFO:root:[step 231999] mlm_loss=1.56948 mlm_acc=65.06329 nsp_loss=0.05393 nsp_acc=98.036 throughput=122.0K tks/s lr=0.0000768 time=111.38 INFO:root:[step 232249] mlm_loss=1.68125 mlm_acc=61.91012 nsp_loss=0.06484 nsp_acc=97.568 throughput=139.0K tks/s lr=0.0000768 time=135.96 INFO:root:[step 232499] mlm_loss=1.78610 mlm_acc=63.02402 nsp_loss=0.04119 nsp_acc=98.500 throughput=137.0K tks/s lr=0.0000768 time=125.93 INFO:root:[step 232749] mlm_loss=1.88845 mlm_acc=60.32385 nsp_loss=0.09135 nsp_acc=96.395 throughput=153.0K tks/s lr=0.0000767 time=160.20 INFO:root:[step 232999] mlm_loss=1.72830 mlm_acc=63.78045 nsp_loss=0.04137 nsp_acc=98.452 throughput=130.0K tks/s lr=0.0000767 time=127.36 INFO:root:[step 233249] mlm_loss=1.57392 mlm_acc=64.63090 nsp_loss=0.07944 nsp_acc=96.835 throughput=126.0K tks/s lr=0.0000767 time=109.17 INFO:root:[step 233499] mlm_loss=1.86047 mlm_acc=61.70197 nsp_loss=0.13520 nsp_acc=94.228 throughput=144.0K tks/s lr=0.0000767 time=146.36 INFO:root:[step 233749] mlm_loss=1.80521 mlm_acc=63.09632 nsp_loss=0.04267 nsp_acc=98.409 throughput=129.0K tks/s lr=0.0000766 time=130.37 INFO:root:[step 233999] mlm_loss=1.64548 mlm_acc=64.60381 nsp_loss=0.04590 nsp_acc=98.280 throughput=124.0K tks/s lr=0.0000766 time=109.36 INFO:root:[step 234249] mlm_loss=1.84203 mlm_acc=61.99229 nsp_loss=0.04401 nsp_acc=98.375 throughput=144.0K tks/s lr=0.0000766 time=137.50 INFO:root:[step 234499] mlm_loss=1.88111 mlm_acc=60.95663 nsp_loss=0.09226 nsp_acc=96.235 throughput=160.0K tks/s lr=0.0000766 time=164.03 INFO:root:[step 234749] mlm_loss=1.50014 mlm_acc=66.33079 nsp_loss=0.06987 nsp_acc=97.382 throughput=106.0K tks/s lr=0.0000765 time=118.03 INFO:root:[step 234999] mlm_loss=1.67309 mlm_acc=62.74097 nsp_loss=0.06982 nsp_acc=97.305 throughput=137.0K tks/s lr=0.0000765 time=138.42 INFO:root:[step 234999] Saving checkpoints to /home/ubuntu/ckpt-master/0234999.params, /home/ubuntu/ckpt-master/0234999.states. INFO:root:[step 235249] mlm_loss=1.67017 mlm_acc=63.23018 nsp_loss=0.06408 nsp_acc=97.496 throughput=112.0K tks/s lr=0.0000765 time=125.14 INFO:root:[step 235499] mlm_loss=1.92924 mlm_acc=59.89216 nsp_loss=0.11135 nsp_acc=95.361 throughput=142.0K tks/s lr=0.0000765 time=144.63 INFO:root:[step 235749] mlm_loss=1.74512 mlm_acc=62.30463 nsp_loss=0.06696 nsp_acc=97.389 throughput=133.0K tks/s lr=0.0000764 time=135.39 INFO:root:[step 235999] mlm_loss=1.54175 mlm_acc=64.71204 nsp_loss=0.05769 nsp_acc=97.820 throughput=120.0K tks/s lr=0.0000764 time=107.54 INFO:root:[step 236249] mlm_loss=1.65639 mlm_acc=64.40062 nsp_loss=0.04382 nsp_acc=98.452 throughput=127.0K tks/s lr=0.0000764 time=111.59 INFO:root:[step 236499] mlm_loss=1.82317 mlm_acc=62.91767 nsp_loss=0.04206 nsp_acc=98.453 throughput=135.0K tks/s lr=0.0000764 time=128.00 INFO:root:[step 236749] mlm_loss=1.86665 mlm_acc=62.15653 nsp_loss=0.06425 nsp_acc=97.387 throughput=147.0K tks/s lr=0.0000763 time=143.42 INFO:root:[step 236999] mlm_loss=1.94898 mlm_acc=60.39330 nsp_loss=0.08953 nsp_acc=96.371 throughput=158.0K tks/s lr=0.0000763 time=176.72 INFO:root:[step 237249] mlm_loss=1.79933 mlm_acc=63.00938 nsp_loss=0.04342 nsp_acc=98.400 throughput=131.0K tks/s lr=0.0000763 time=130.49 INFO:root:[step 237499] mlm_loss=1.56884 mlm_acc=65.31761 nsp_loss=0.04574 nsp_acc=98.357 throughput=124.0K tks/s lr=0.0000763 time=107.23 INFO:root:[step 237749] mlm_loss=1.76561 mlm_acc=63.65049 nsp_loss=0.04494 nsp_acc=98.404 throughput=136.0K tks/s lr=0.0000762 time=117.99 INFO:root:[step 237999] mlm_loss=1.69944 mlm_acc=64.44133 nsp_loss=0.04408 nsp_acc=98.448 throughput=125.0K tks/s lr=0.0000762 time=122.64 INFO:root:[step 238249] mlm_loss=1.81576 mlm_acc=63.07964 nsp_loss=0.04312 nsp_acc=98.412 throughput=132.0K tks/s lr=0.0000762 time=128.45 INFO:root:[step 238499] mlm_loss=1.66532 mlm_acc=64.59902 nsp_loss=0.04454 nsp_acc=98.407 throughput=124.0K tks/s lr=0.0000762 time=111.62 INFO:root:[step 238749] mlm_loss=1.72868 mlm_acc=62.57207 nsp_loss=0.10787 nsp_acc=95.485 throughput=149.0K tks/s lr=0.0000761 time=145.21 INFO:root:[step 238999] mlm_loss=1.94500 mlm_acc=60.42648 nsp_loss=0.06925 nsp_acc=97.271 throughput=152.0K tks/s lr=0.0000761 time=165.81 INFO:root:[step 239249] mlm_loss=1.96449 mlm_acc=59.60845 nsp_loss=0.11327 nsp_acc=95.301 throughput=152.0K tks/s lr=0.0000761 time=156.15 INFO:root:[step 239499] mlm_loss=2.02551 mlm_acc=59.74312 nsp_loss=0.12372 nsp_acc=94.849 throughput=145.0K tks/s lr=0.0000761 time=146.50 INFO:root:[step 239749] mlm_loss=1.85688 mlm_acc=62.52776 nsp_loss=0.08436 nsp_acc=96.501 throughput=139.0K tks/s lr=0.0000760 time=138.19 INFO:root:[step 239999] mlm_loss=1.74781 mlm_acc=63.63580 nsp_loss=0.03912 nsp_acc=98.569 throughput=135.0K tks/s lr=0.0000760 time=118.92 INFO:root:[step 239999] Saving checkpoints to /home/ubuntu/ckpt-master/0239999.params, /home/ubuntu/ckpt-master/0239999.states. INFO:root:[step 240249] mlm_loss=1.91477 mlm_acc=60.86260 nsp_loss=0.05411 nsp_acc=97.954 throughput=135.0K tks/s lr=0.0000760 time=161.20 INFO:root:[step 240499] mlm_loss=1.86544 mlm_acc=62.73144 nsp_loss=0.04609 nsp_acc=98.327 throughput=136.0K tks/s lr=0.0000760 time=130.96 INFO:root:[step 240749] mlm_loss=1.83093 mlm_acc=62.78273 nsp_loss=0.07410 nsp_acc=97.046 throughput=146.0K tks/s lr=0.0000759 time=149.01 INFO:root:[step 240999] mlm_loss=1.57740 mlm_acc=65.63776 nsp_loss=0.05215 nsp_acc=98.155 throughput=124.0K tks/s lr=0.0000759 time=121.35 INFO:root:[step 241249] mlm_loss=1.73631 mlm_acc=63.14563 nsp_loss=0.07912 nsp_acc=96.916 throughput=146.0K tks/s lr=0.0000759 time=148.94 INFO:root:[step 241499] mlm_loss=1.56897 mlm_acc=65.49688 nsp_loss=0.04724 nsp_acc=98.338 throughput=115.0K tks/s lr=0.0000759 time=107.83 INFO:root:[step 241749] mlm_loss=1.63807 mlm_acc=64.49236 nsp_loss=0.05015 nsp_acc=98.180 throughput=118.0K tks/s lr=0.0000758 time=118.62 INFO:root:[step 241999] mlm_loss=1.79162 mlm_acc=63.57348 nsp_loss=0.04119 nsp_acc=98.474 throughput=139.0K tks/s lr=0.0000758 time=118.82 INFO:root:[step 242249] mlm_loss=1.91892 mlm_acc=60.50814 nsp_loss=0.10556 nsp_acc=95.665 throughput=148.0K tks/s lr=0.0000758 time=166.97 INFO:root:[step 242499] mlm_loss=1.58961 mlm_acc=64.85467 nsp_loss=0.04336 nsp_acc=98.435 throughput=124.0K tks/s lr=0.0000758 time=106.60 INFO:root:[step 242749] mlm_loss=1.65843 mlm_acc=64.47639 nsp_loss=0.04599 nsp_acc=98.322 throughput=127.0K tks/s lr=0.0000757 time=114.27 INFO:root:[step 242999] mlm_loss=1.77441 mlm_acc=62.67459 nsp_loss=0.06918 nsp_acc=97.207 throughput=145.0K tks/s lr=0.0000757 time=137.16 INFO:root:[step 243249] mlm_loss=1.79766 mlm_acc=62.06250 nsp_loss=0.05618 nsp_acc=97.834 throughput=137.0K tks/s lr=0.0000757 time=136.18 INFO:root:[step 243499] mlm_loss=1.77586 mlm_acc=63.19987 nsp_loss=0.06595 nsp_acc=97.330 throughput=129.0K tks/s lr=0.0000757 time=125.24 INFO:root:[step 243749] mlm_loss=1.87281 mlm_acc=61.90113 nsp_loss=0.08384 nsp_acc=96.407 throughput=144.0K tks/s lr=0.0000756 time=141.75 INFO:root:[step 243999] mlm_loss=1.77636 mlm_acc=63.49845 nsp_loss=0.04306 nsp_acc=98.395 throughput=134.0K tks/s lr=0.0000756 time=118.28 INFO:root:[step 244249] mlm_loss=1.65447 mlm_acc=64.58047 nsp_loss=0.04535 nsp_acc=98.386 throughput=117.0K tks/s lr=0.0000756 time=121.41 INFO:root:[step 244499] mlm_loss=1.75761 mlm_acc=63.81714 nsp_loss=0.04601 nsp_acc=98.353 throughput=133.0K tks/s lr=0.0000756 time=115.34 INFO:root:[step 244749] mlm_loss=1.72418 mlm_acc=64.22932 nsp_loss=0.04253 nsp_acc=98.466 throughput=126.0K tks/s lr=0.0000755 time=127.79 INFO:root:[step 244999] mlm_loss=1.56194 mlm_acc=65.44741 nsp_loss=0.04875 nsp_acc=98.217 throughput=116.0K tks/s lr=0.0000755 time=105.52 INFO:root:[step 244999] Saving checkpoints to /home/ubuntu/ckpt-master/0244999.params, /home/ubuntu/ckpt-master/0244999.states. INFO:root:[step 245249] mlm_loss=1.62414 mlm_acc=65.06643 nsp_loss=0.04485 nsp_acc=98.352 throughput=106.0K tks/s lr=0.0000755 time=122.43 INFO:root:[step 245499] mlm_loss=1.71900 mlm_acc=62.61081 nsp_loss=0.06755 nsp_acc=97.416 throughput=137.0K tks/s lr=0.0000755 time=139.58 INFO:root:[step 245749] mlm_loss=1.80352 mlm_acc=61.67661 nsp_loss=0.08810 nsp_acc=96.516 throughput=150.0K tks/s lr=0.0000754 time=168.89 INFO:root:[step 245999] mlm_loss=1.64604 mlm_acc=64.71773 nsp_loss=0.04969 nsp_acc=98.244 throughput=122.0K tks/s lr=0.0000754 time=109.67 INFO:root:[step 246249] mlm_loss=1.81728 mlm_acc=61.88124 nsp_loss=0.05591 nsp_acc=97.912 throughput=146.0K tks/s lr=0.0000754 time=141.39 INFO:root:[step 246499] mlm_loss=1.69238 mlm_acc=64.13126 nsp_loss=0.05600 nsp_acc=97.865 throughput=118.0K tks/s lr=0.0000754 time=123.71 INFO:root:[step 246749] mlm_loss=1.55172 mlm_acc=64.40703 nsp_loss=0.05829 nsp_acc=97.924 throughput=127.0K tks/s lr=0.0000753 time=108.37 INFO:root:[step 246999] mlm_loss=1.69663 mlm_acc=63.81760 nsp_loss=0.04826 nsp_acc=98.177 throughput=125.0K tks/s lr=0.0000753 time=125.32 INFO:root:[step 247249] mlm_loss=1.89763 mlm_acc=60.82744 nsp_loss=0.07095 nsp_acc=97.188 throughput=137.0K tks/s lr=0.0000753 time=129.18 INFO:root:[step 247499] mlm_loss=1.95094 mlm_acc=60.05762 nsp_loss=0.12839 nsp_acc=94.493 throughput=149.0K tks/s lr=0.0000753 time=147.82 INFO:root:[step 247749] mlm_loss=1.76575 mlm_acc=63.09864 nsp_loss=0.05100 nsp_acc=98.117 throughput=131.0K tks/s lr=0.0000752 time=131.43 INFO:root:[step 247999] mlm_loss=1.78690 mlm_acc=62.22163 nsp_loss=0.10356 nsp_acc=95.774 throughput=142.0K tks/s lr=0.0000752 time=139.01 INFO:root:[step 248249] mlm_loss=1.88237 mlm_acc=62.15162 nsp_loss=0.04672 nsp_acc=98.233 throughput=144.0K tks/s lr=0.0000752 time=143.36 INFO:root:[step 248499] mlm_loss=1.70865 mlm_acc=64.71649 nsp_loss=0.04800 nsp_acc=98.215 throughput=124.0K tks/s lr=0.0000752 time=122.64 INFO:root:[step 248749] mlm_loss=1.65471 mlm_acc=64.58145 nsp_loss=0.04765 nsp_acc=98.284 throughput=120.0K tks/s lr=0.0000751 time=109.88 INFO:root:[step 248999] mlm_loss=1.75101 mlm_acc=63.82522 nsp_loss=0.04353 nsp_acc=98.310 throughput=132.0K tks/s lr=0.0000751 time=125.41 INFO:root:[step 249249] mlm_loss=1.74026 mlm_acc=63.98750 nsp_loss=0.04257 nsp_acc=98.432 throughput=135.0K tks/s lr=0.0000751 time=118.99 INFO:root:[step 249499] mlm_loss=1.95399 mlm_acc=60.37950 nsp_loss=0.07125 nsp_acc=97.191 throughput=135.0K tks/s lr=0.0000751 time=134.14 INFO:root:[step 249749] mlm_loss=1.63844 mlm_acc=64.48416 nsp_loss=0.04645 nsp_acc=98.311 throughput=128.0K tks/s lr=0.0000750 time=114.84 INFO:root:[step 249999] mlm_loss=1.85442 mlm_acc=60.95037 nsp_loss=0.08497 nsp_acc=96.588 throughput=149.0K tks/s lr=0.0000750 time=167.70 INFO:root:[step 249999] Saving checkpoints to /home/ubuntu/ckpt-master/0249999.params, /home/ubuntu/ckpt-master/0249999.states. INFO:root:[step 250249] mlm_loss=1.62374 mlm_acc=65.02435 nsp_loss=0.04443 nsp_acc=98.382 throughput=111.0K tks/s lr=0.0000750 time=123.41 INFO:root:[step 250499] mlm_loss=1.81474 mlm_acc=61.32844 nsp_loss=0.05611 nsp_acc=97.938 throughput=142.0K tks/s lr=0.0000750 time=141.58 INFO:root:[step 250749] mlm_loss=1.77311 mlm_acc=63.63395 nsp_loss=0.04125 nsp_acc=98.502 throughput=133.0K tks/s lr=0.0000749 time=127.11 INFO:root:[step 250999] mlm_loss=1.68353 mlm_acc=64.22317 nsp_loss=0.04372 nsp_acc=98.433 throughput=129.0K tks/s lr=0.0000749 time=118.12 INFO:root:[step 251249] mlm_loss=2.07431 mlm_acc=59.05489 nsp_loss=0.09886 nsp_acc=96.151 throughput=135.0K tks/s lr=0.0000749 time=141.87 INFO:root:[step 251499] mlm_loss=1.72034 mlm_acc=63.10175 nsp_loss=0.07753 nsp_acc=96.933 throughput=137.0K tks/s lr=0.0000749 time=134.25 INFO:root:[step 251749] mlm_loss=1.97647 mlm_acc=60.74257 nsp_loss=0.08304 nsp_acc=96.739 throughput=143.0K tks/s lr=0.0000748 time=144.25 INFO:root:[step 251999] mlm_loss=1.72682 mlm_acc=62.81365 nsp_loss=0.06145 nsp_acc=97.696 throughput=125.0K tks/s lr=0.0000748 time=127.00 INFO:root:[step 252249] mlm_loss=1.66121 mlm_acc=64.11749 nsp_loss=0.04354 nsp_acc=98.410 throughput=135.0K tks/s lr=0.0000748 time=117.49 INFO:root:[step 252499] mlm_loss=1.66128 mlm_acc=64.78569 nsp_loss=0.04585 nsp_acc=98.394 throughput=119.0K tks/s lr=0.0000748 time=119.99 INFO:root:[step 252749] mlm_loss=1.68494 mlm_acc=64.30852 nsp_loss=0.04956 nsp_acc=98.188 throughput=124.0K tks/s lr=0.0000747 time=112.87 INFO:root:[step 252999] mlm_loss=1.72659 mlm_acc=63.53030 nsp_loss=0.04335 nsp_acc=98.391 throughput=131.0K tks/s lr=0.0000747 time=126.34 INFO:root:[step 253249] mlm_loss=1.76755 mlm_acc=63.29253 nsp_loss=0.04311 nsp_acc=98.443 throughput=141.0K tks/s lr=0.0000747 time=120.51 INFO:root:[step 253499] mlm_loss=1.36854 mlm_acc=67.03579 nsp_loss=0.05537 nsp_acc=98.019 throughput=102.0K tks/s lr=0.0000747 time=103.38 INFO:root:[step 253749] mlm_loss=1.76107 mlm_acc=62.32967 nsp_loss=0.06079 nsp_acc=97.692 throughput=142.0K tks/s lr=0.0000746 time=137.80 INFO:root:[step 253999] mlm_loss=1.78432 mlm_acc=63.19772 nsp_loss=0.04409 nsp_acc=98.396 throughput=134.0K tks/s lr=0.0000746 time=131.08 INFO:root:[step 254249] mlm_loss=1.75978 mlm_acc=63.44739 nsp_loss=0.04006 nsp_acc=98.555 throughput=132.0K tks/s lr=0.0000746 time=129.14 INFO:root:[step 254499] mlm_loss=1.62408 mlm_acc=65.09135 nsp_loss=0.04615 nsp_acc=98.333 throughput=126.0K tks/s lr=0.0000746 time=111.49 INFO:root:[step 254749] mlm_loss=1.82870 mlm_acc=63.12301 nsp_loss=0.04136 nsp_acc=98.488 throughput=141.0K tks/s lr=0.0000745 time=138.31 INFO:root:[step 254999] mlm_loss=1.60126 mlm_acc=65.23363 nsp_loss=0.04499 nsp_acc=98.409 throughput=115.0K tks/s lr=0.0000745 time=117.33 INFO:root:[step 254999] Saving checkpoints to /home/ubuntu/ckpt-master/0254999.params, /home/ubuntu/ckpt-master/0254999.states. INFO:root:[step 255249] mlm_loss=1.64052 mlm_acc=64.65783 nsp_loss=0.04544 nsp_acc=98.338 throughput=110.0K tks/s lr=0.0000745 time=126.01 INFO:root:[step 255499] mlm_loss=1.77187 mlm_acc=62.02390 nsp_loss=0.10814 nsp_acc=95.642 throughput=142.0K tks/s lr=0.0000745 time=138.28 INFO:root:[step 255749] mlm_loss=1.91012 mlm_acc=60.12674 nsp_loss=0.11238 nsp_acc=95.197 throughput=142.0K tks/s lr=0.0000744 time=144.01 INFO:root:[step 255999] mlm_loss=1.57338 mlm_acc=65.39796 nsp_loss=0.04793 nsp_acc=98.329 throughput=123.0K tks/s lr=0.0000744 time=108.01 INFO:root:[step 256249] mlm_loss=1.73908 mlm_acc=62.06214 nsp_loss=0.07749 nsp_acc=96.947 throughput=136.0K tks/s lr=0.0000744 time=136.17 INFO:root:[step 256499] mlm_loss=1.58192 mlm_acc=65.42377 nsp_loss=0.05242 nsp_acc=98.083 throughput=123.0K tks/s lr=0.0000744 time=110.75 INFO:root:[step 256749] mlm_loss=1.67898 mlm_acc=64.35582 nsp_loss=0.04939 nsp_acc=98.184 throughput=114.0K tks/s lr=0.0000743 time=121.29 INFO:root:[step 256999] mlm_loss=1.71678 mlm_acc=61.95733 nsp_loss=0.07400 nsp_acc=97.171 throughput=133.0K tks/s lr=0.0000743 time=116.73 INFO:root:[step 257249] mlm_loss=1.84733 mlm_acc=62.69858 nsp_loss=0.04592 nsp_acc=98.277 throughput=137.0K tks/s lr=0.0000743 time=135.79 INFO:root:[step 257499] mlm_loss=1.64371 mlm_acc=64.40427 nsp_loss=0.05512 nsp_acc=97.970 throughput=120.0K tks/s lr=0.0000743 time=122.26 INFO:root:[step 257749] mlm_loss=1.92633 mlm_acc=59.97857 nsp_loss=0.12801 nsp_acc=94.550 throughput=155.0K tks/s lr=0.0000742 time=159.31 INFO:root:[step 257999] mlm_loss=1.88718 mlm_acc=61.90428 nsp_loss=0.05433 nsp_acc=97.888 throughput=142.0K tks/s lr=0.0000742 time=136.02 INFO:root:[step 258249] mlm_loss=1.87636 mlm_acc=61.83985 nsp_loss=0.08230 nsp_acc=96.533 throughput=148.0K tks/s lr=0.0000742 time=143.88 INFO:root:[step 258499] mlm_loss=1.66119 mlm_acc=63.27365 nsp_loss=0.10776 nsp_acc=95.561 throughput=143.0K tks/s lr=0.0000742 time=144.51 INFO:root:[step 258749] mlm_loss=1.53673 mlm_acc=65.70476 nsp_loss=0.05043 nsp_acc=98.273 throughput=116.0K tks/s lr=0.0000741 time=106.26 INFO:root:[step 258999] mlm_loss=1.78447 mlm_acc=62.63889 nsp_loss=0.06254 nsp_acc=97.607 throughput=133.0K tks/s lr=0.0000741 time=128.73 INFO:root:[step 259249] mlm_loss=1.96985 mlm_acc=60.54256 nsp_loss=0.12240 nsp_acc=94.978 throughput=148.0K tks/s lr=0.0000741 time=146.54 INFO:root:[step 259499] mlm_loss=1.91725 mlm_acc=62.16719 nsp_loss=0.04009 nsp_acc=98.568 throughput=150.0K tks/s lr=0.0000741 time=145.59 INFO:root:[step 259749] mlm_loss=1.85537 mlm_acc=62.76558 nsp_loss=0.04159 nsp_acc=98.468 throughput=138.0K tks/s lr=0.0000740 time=136.13 INFO:root:[step 259999] mlm_loss=1.78915 mlm_acc=63.05817 nsp_loss=0.04326 nsp_acc=98.455 throughput=136.0K tks/s lr=0.0000740 time=133.71 INFO:root:[step 259999] Saving checkpoints to /home/ubuntu/ckpt-master/0259999.params, /home/ubuntu/ckpt-master/0259999.states. INFO:root:[step 260249] mlm_loss=1.65025 mlm_acc=64.74523 nsp_loss=0.04779 nsp_acc=98.285 throughput=109.0K tks/s lr=0.0000740 time=125.70 INFO:root:[step 260499] mlm_loss=1.62296 mlm_acc=64.76448 nsp_loss=0.04660 nsp_acc=98.310 throughput=121.0K tks/s lr=0.0000740 time=118.16 INFO:root:[step 260749] mlm_loss=1.71846 mlm_acc=63.36232 nsp_loss=0.04127 nsp_acc=98.542 throughput=130.0K tks/s lr=0.0000739 time=129.17 INFO:root:[step 260999] mlm_loss=1.89920 mlm_acc=61.59812 nsp_loss=0.05286 nsp_acc=98.016 throughput=151.0K tks/s lr=0.0000739 time=150.10 INFO:root:[step 261249] mlm_loss=1.92790 mlm_acc=61.42767 nsp_loss=0.08083 nsp_acc=96.742 throughput=154.0K tks/s lr=0.0000739 time=151.79 INFO:root:[step 261499] mlm_loss=1.80807 mlm_acc=63.13640 nsp_loss=0.04274 nsp_acc=98.407 throughput=133.0K tks/s lr=0.0000739 time=132.74 INFO:root:[step 261749] mlm_loss=1.76258 mlm_acc=63.76114 nsp_loss=0.04579 nsp_acc=98.356 throughput=138.0K tks/s lr=0.0000738 time=117.93 INFO:root:[step 261999] mlm_loss=1.79118 mlm_acc=63.62528 nsp_loss=0.04158 nsp_acc=98.432 throughput=136.0K tks/s lr=0.0000738 time=130.84 INFO:root:[step 262249] mlm_loss=1.61520 mlm_acc=65.06633 nsp_loss=0.04409 nsp_acc=98.410 throughput=123.0K tks/s lr=0.0000738 time=119.96 INFO:root:[step 262499] mlm_loss=1.92178 mlm_acc=60.91969 nsp_loss=0.06390 nsp_acc=97.477 throughput=145.0K tks/s lr=0.0000738 time=149.68 INFO:root:[step 262749] mlm_loss=1.67938 mlm_acc=64.53565 nsp_loss=0.04924 nsp_acc=98.196 throughput=126.0K tks/s lr=0.0000737 time=113.10 INFO:root:[step 262999] mlm_loss=1.70545 mlm_acc=64.11424 nsp_loss=0.04618 nsp_acc=98.340 throughput=124.0K tks/s lr=0.0000737 time=122.74 INFO:root:[step 263249] mlm_loss=1.85647 mlm_acc=62.76610 nsp_loss=0.04169 nsp_acc=98.471 throughput=139.0K tks/s lr=0.0000737 time=137.23 INFO:root:[step 263499] mlm_loss=1.65504 mlm_acc=64.80548 nsp_loss=0.04966 nsp_acc=98.234 throughput=125.0K tks/s lr=0.0000737 time=109.55 INFO:root:[step 263749] mlm_loss=1.66318 mlm_acc=64.54815 nsp_loss=0.04679 nsp_acc=98.268 throughput=118.0K tks/s lr=0.0000736 time=121.21 INFO:root:[step 263999] mlm_loss=1.64608 mlm_acc=64.43968 nsp_loss=0.04258 nsp_acc=98.522 throughput=137.0K tks/s lr=0.0000736 time=114.90 INFO:root:[step 264249] mlm_loss=1.66189 mlm_acc=64.47533 nsp_loss=0.04639 nsp_acc=98.316 throughput=119.0K tks/s lr=0.0000736 time=125.72 INFO:root:[step 264499] mlm_loss=1.60764 mlm_acc=63.17130 nsp_loss=0.08200 nsp_acc=96.794 throughput=140.0K tks/s lr=0.0000736 time=123.64 INFO:root:[step 264749] mlm_loss=1.74448 mlm_acc=63.66701 nsp_loss=0.04673 nsp_acc=98.354 throughput=129.0K tks/s lr=0.0000735 time=128.54 INFO:root:[step 264999] mlm_loss=1.80877 mlm_acc=63.09823 nsp_loss=0.05541 nsp_acc=97.866 throughput=153.0K tks/s lr=0.0000735 time=151.34 INFO:root:[step 264999] Saving checkpoints to /home/ubuntu/ckpt-master/0264999.params, /home/ubuntu/ckpt-master/0264999.states. INFO:root:[step 265249] mlm_loss=1.82685 mlm_acc=63.28079 nsp_loss=0.04303 nsp_acc=98.385 throughput=126.0K tks/s lr=0.0000735 time=150.55 INFO:root:[step 265499] mlm_loss=1.65814 mlm_acc=64.63679 nsp_loss=0.04437 nsp_acc=98.425 throughput=118.0K tks/s lr=0.0000735 time=121.93 INFO:root:[step 265749] mlm_loss=1.73444 mlm_acc=63.80641 nsp_loss=0.04261 nsp_acc=98.478 throughput=132.0K tks/s lr=0.0000734 time=128.59 INFO:root:[step 265999] mlm_loss=1.77015 mlm_acc=62.89177 nsp_loss=0.09663 nsp_acc=95.988 throughput=149.0K tks/s lr=0.0000734 time=132.17 INFO:root:[step 266249] mlm_loss=1.76287 mlm_acc=62.10642 nsp_loss=0.08530 nsp_acc=96.649 throughput=137.0K tks/s lr=0.0000734 time=136.90 INFO:root:[step 266499] mlm_loss=1.58113 mlm_acc=65.61432 nsp_loss=0.05070 nsp_acc=98.163 throughput=116.0K tks/s lr=0.0000734 time=105.81 INFO:root:[step 266749] mlm_loss=1.73072 mlm_acc=62.37619 nsp_loss=0.09523 nsp_acc=96.111 throughput=133.0K tks/s lr=0.0000733 time=133.78 INFO:root:[step 266999] mlm_loss=1.90007 mlm_acc=61.14538 nsp_loss=0.05858 nsp_acc=97.761 throughput=147.0K tks/s lr=0.0000733 time=143.63 INFO:root:[step 267249] mlm_loss=1.59946 mlm_acc=64.56197 nsp_loss=0.05586 nsp_acc=97.942 throughput=114.0K tks/s lr=0.0000733 time=117.61 INFO:root:[step 267499] mlm_loss=1.68012 mlm_acc=63.73529 nsp_loss=0.04797 nsp_acc=98.277 throughput=136.0K tks/s lr=0.0000733 time=126.99 INFO:root:[step 267749] mlm_loss=1.90059 mlm_acc=61.24658 nsp_loss=0.06870 nsp_acc=97.254 throughput=145.0K tks/s lr=0.0000732 time=147.45 INFO:root:[step 267999] mlm_loss=1.79861 mlm_acc=62.49092 nsp_loss=0.06111 nsp_acc=97.653 throughput=143.0K tks/s lr=0.0000732 time=141.79 INFO:root:[step 268249] mlm_loss=1.80636 mlm_acc=63.49780 nsp_loss=0.04118 nsp_acc=98.512 throughput=138.0K tks/s lr=0.0000732 time=134.93 INFO:root:[step 268499] mlm_loss=1.83060 mlm_acc=61.51033 nsp_loss=0.05719 nsp_acc=97.805 throughput=140.0K tks/s lr=0.0000732 time=142.08 INFO:root:[step 268749] mlm_loss=1.65865 mlm_acc=64.70011 nsp_loss=0.04695 nsp_acc=98.327 throughput=128.0K tks/s lr=0.0000731 time=110.89 INFO:root:[step 268999] mlm_loss=1.74889 mlm_acc=63.51522 nsp_loss=0.04245 nsp_acc=98.468 throughput=134.0K tks/s lr=0.0000731 time=130.53 INFO:root:[step 269249] mlm_loss=1.72916 mlm_acc=61.60863 nsp_loss=0.05062 nsp_acc=98.133 throughput=134.0K tks/s lr=0.0000731 time=136.01 INFO:root:[step 269499] mlm_loss=1.59213 mlm_acc=64.16911 nsp_loss=0.08418 nsp_acc=96.593 throughput=132.0K tks/s lr=0.0000731 time=116.30 INFO:root:[step 269749] mlm_loss=1.54913 mlm_acc=66.66714 nsp_loss=0.09638 nsp_acc=96.184 throughput=147.0K tks/s lr=0.0000730 time=143.70 INFO:root:[step 269999] mlm_loss=1.70440 mlm_acc=63.59988 nsp_loss=0.11202 nsp_acc=95.463 throughput=157.0K tks/s lr=0.0000730 time=170.52 INFO:root:[step 269999] Saving checkpoints to /home/ubuntu/ckpt-master/0269999.params, /home/ubuntu/ckpt-master/0269999.states. INFO:root:[step 270249] mlm_loss=1.77758 mlm_acc=61.71586 nsp_loss=0.07980 nsp_acc=96.985 throughput=125.0K tks/s lr=0.0000730 time=143.26 INFO:root:[step 270499] mlm_loss=1.65139 mlm_acc=63.56124 nsp_loss=0.06320 nsp_acc=97.573 throughput=138.0K tks/s lr=0.0000730 time=137.58 INFO:root:[step 270749] mlm_loss=1.78999 mlm_acc=62.49590 nsp_loss=0.07943 nsp_acc=96.910 throughput=148.0K tks/s lr=0.0000729 time=147.34 INFO:root:[step 270999] mlm_loss=1.80310 mlm_acc=63.71565 nsp_loss=0.04303 nsp_acc=98.422 throughput=134.0K tks/s lr=0.0000729 time=131.35 INFO:root:[step 271249] mlm_loss=1.71316 mlm_acc=64.19100 nsp_loss=0.04711 nsp_acc=98.265 throughput=122.0K tks/s lr=0.0000729 time=123.47 INFO:root:[step 271499] mlm_loss=1.65423 mlm_acc=64.77802 nsp_loss=0.04501 nsp_acc=98.410 throughput=130.0K tks/s lr=0.0000729 time=113.22 INFO:root:[step 271749] mlm_loss=1.78586 mlm_acc=63.45274 nsp_loss=0.03945 nsp_acc=98.579 throughput=133.0K tks/s lr=0.0000728 time=135.27 INFO:root:[step 271999] mlm_loss=1.66442 mlm_acc=63.87494 nsp_loss=0.08464 nsp_acc=96.566 throughput=142.0K tks/s lr=0.0000728 time=140.12 INFO:root:[step 272249] mlm_loss=1.74391 mlm_acc=64.10237 nsp_loss=0.04302 nsp_acc=98.428 throughput=135.0K tks/s lr=0.0000728 time=118.21 INFO:root:[step 272499] mlm_loss=1.83187 mlm_acc=62.64045 nsp_loss=0.06834 nsp_acc=97.332 throughput=148.0K tks/s lr=0.0000728 time=142.89 INFO:root:[step 272749] mlm_loss=1.54362 mlm_acc=65.32116 nsp_loss=0.05436 nsp_acc=97.997 throughput=108.0K tks/s lr=0.0000727 time=116.52 INFO:root:[step 272999] mlm_loss=1.69648 mlm_acc=64.32275 nsp_loss=0.04735 nsp_acc=98.252 throughput=131.0K tks/s lr=0.0000727 time=112.58 INFO:root:[step 273249] mlm_loss=1.97204 mlm_acc=59.51402 nsp_loss=0.08746 nsp_acc=96.519 throughput=149.0K tks/s lr=0.0000727 time=170.03 INFO:root:[step 273499] mlm_loss=1.61310 mlm_acc=64.96773 nsp_loss=0.04909 nsp_acc=98.192 throughput=121.0K tks/s lr=0.0000727 time=109.86 INFO:root:[step 273749] mlm_loss=1.66136 mlm_acc=65.15046 nsp_loss=0.04595 nsp_acc=98.336 throughput=125.0K tks/s lr=0.0000726 time=111.98 INFO:root:[step 273999] mlm_loss=1.87565 mlm_acc=61.82901 nsp_loss=0.08823 nsp_acc=96.450 throughput=146.0K tks/s lr=0.0000726 time=141.81 INFO:root:[step 274249] mlm_loss=1.63627 mlm_acc=64.74004 nsp_loss=0.04663 nsp_acc=98.288 throughput=115.0K tks/s lr=0.0000726 time=118.20 INFO:root:[step 274499] mlm_loss=1.60542 mlm_acc=65.23690 nsp_loss=0.04992 nsp_acc=98.170 throughput=120.0K tks/s lr=0.0000726 time=108.74 INFO:root:[step 274749] mlm_loss=1.79376 mlm_acc=62.84767 nsp_loss=0.05758 nsp_acc=97.743 throughput=140.0K tks/s lr=0.0000725 time=132.81 INFO:root:[step 274999] mlm_loss=1.70649 mlm_acc=63.22562 nsp_loss=0.06489 nsp_acc=97.501 throughput=130.0K tks/s lr=0.0000725 time=132.21 INFO:root:[step 274999] Saving checkpoints to /home/ubuntu/ckpt-master/0274999.params, /home/ubuntu/ckpt-master/0274999.states. INFO:root:[step 275249] mlm_loss=1.42842 mlm_acc=71.18027 nsp_loss=0.06769 nsp_acc=97.621 throughput=133.0K tks/s lr=0.0000725 time=147.91 INFO:root:[step 275499] mlm_loss=1.86483 mlm_acc=62.62390 nsp_loss=0.04153 nsp_acc=98.495 throughput=142.0K tks/s lr=0.0000725 time=138.20 INFO:root:[step 275749] mlm_loss=1.88555 mlm_acc=61.62111 nsp_loss=0.06101 nsp_acc=97.661 throughput=146.0K tks/s lr=0.0000724 time=162.34 INFO:root:[step 275999] mlm_loss=1.78355 mlm_acc=63.97091 nsp_loss=0.04501 nsp_acc=98.353 throughput=139.0K tks/s lr=0.0000724 time=119.95 INFO:root:[step 276249] mlm_loss=1.82208 mlm_acc=62.33774 nsp_loss=0.06690 nsp_acc=97.408 throughput=146.0K tks/s lr=0.0000724 time=145.20 INFO:root:[step 276499] mlm_loss=1.85989 mlm_acc=61.58631 nsp_loss=0.05624 nsp_acc=97.869 throughput=144.0K tks/s lr=0.0000724 time=155.32 INFO:root:[step 276749] mlm_loss=1.93169 mlm_acc=60.77524 nsp_loss=0.05423 nsp_acc=97.935 throughput=149.0K tks/s lr=0.0000723 time=146.63 INFO:root:[step 276999] mlm_loss=1.92691 mlm_acc=61.22510 nsp_loss=0.07205 nsp_acc=97.159 throughput=138.0K tks/s lr=0.0000723 time=140.61 INFO:root:[step 277249] mlm_loss=1.71362 mlm_acc=62.80223 nsp_loss=0.07821 nsp_acc=96.893 throughput=142.0K tks/s lr=0.0000723 time=123.72 INFO:root:[step 277499] mlm_loss=1.74670 mlm_acc=63.17768 nsp_loss=0.04645 nsp_acc=98.187 throughput=131.0K tks/s lr=0.0000723 time=133.44 INFO:root:[step 277749] mlm_loss=1.91799 mlm_acc=59.89248 nsp_loss=0.07593 nsp_acc=97.077 throughput=150.0K tks/s lr=0.0000722 time=148.48 INFO:root:[step 277999] mlm_loss=1.86747 mlm_acc=61.67475 nsp_loss=0.05645 nsp_acc=97.858 throughput=148.0K tks/s lr=0.0000722 time=144.80 INFO:root:[step 278249] mlm_loss=1.83713 mlm_acc=63.08436 nsp_loss=0.04443 nsp_acc=98.356 throughput=139.0K tks/s lr=0.0000722 time=137.09 INFO:root:[step 278499] mlm_loss=1.61096 mlm_acc=65.13409 nsp_loss=0.04637 nsp_acc=98.368 throughput=116.0K tks/s lr=0.0000722 time=119.98 INFO:root:[step 278749] mlm_loss=1.71818 mlm_acc=63.37908 nsp_loss=0.06319 nsp_acc=97.611 throughput=140.0K tks/s lr=0.0000721 time=138.15 INFO:root:[step 278999] mlm_loss=1.74474 mlm_acc=63.74923 nsp_loss=0.04626 nsp_acc=98.261 throughput=139.0K tks/s lr=0.0000721 time=118.74 INFO:root:[step 279249] mlm_loss=1.84380 mlm_acc=62.33442 nsp_loss=0.07693 nsp_acc=96.959 throughput=148.0K tks/s lr=0.0000721 time=156.92 INFO:root:[step 279499] mlm_loss=1.90259 mlm_acc=61.52753 nsp_loss=0.08111 nsp_acc=96.772 throughput=154.0K tks/s lr=0.0000721 time=154.93 INFO:root:[step 279749] mlm_loss=1.70475 mlm_acc=63.80237 nsp_loss=0.06240 nsp_acc=97.583 throughput=139.0K tks/s lr=0.0000720 time=138.79 INFO:root:[step 279999] mlm_loss=1.72424 mlm_acc=64.04699 nsp_loss=0.04669 nsp_acc=98.327 throughput=132.0K tks/s lr=0.0000720 time=117.26 INFO:root:[step 279999] Saving checkpoints to /home/ubuntu/ckpt-master/0279999.params, /home/ubuntu/ckpt-master/0279999.states. INFO:root:[step 280249] mlm_loss=1.67736 mlm_acc=64.14692 nsp_loss=0.05820 nsp_acc=97.814 throughput=110.0K tks/s lr=0.0000720 time=137.27 INFO:root:[step 280499] mlm_loss=1.83206 mlm_acc=62.38180 nsp_loss=0.10239 nsp_acc=95.647 throughput=143.0K tks/s lr=0.0000720 time=144.48 INFO:root:[step 280749] mlm_loss=1.56246 mlm_acc=65.74589 nsp_loss=0.04904 nsp_acc=98.219 throughput=117.0K tks/s lr=0.0000719 time=105.72 INFO:root:[step 280999] mlm_loss=1.74147 mlm_acc=61.70697 nsp_loss=0.04999 nsp_acc=98.111 throughput=144.0K tks/s lr=0.0000719 time=140.27 INFO:root:[step 281249] mlm_loss=1.62554 mlm_acc=64.86023 nsp_loss=0.04696 nsp_acc=98.246 throughput=125.0K tks/s lr=0.0000719 time=125.84 INFO:root:[step 281499] mlm_loss=1.77017 mlm_acc=63.46460 nsp_loss=0.04152 nsp_acc=98.483 throughput=145.0K tks/s lr=0.0000719 time=124.46 INFO:root:[step 281749] mlm_loss=1.84917 mlm_acc=63.24401 nsp_loss=0.04192 nsp_acc=98.445 throughput=138.0K tks/s lr=0.0000718 time=136.21 INFO:root:[step 281999] mlm_loss=1.57635 mlm_acc=65.01249 nsp_loss=0.04967 nsp_acc=98.153 throughput=112.0K tks/s lr=0.0000718 time=121.53 INFO:root:[step 282249] mlm_loss=1.54606 mlm_acc=65.70588 nsp_loss=0.04861 nsp_acc=98.244 throughput=115.0K tks/s lr=0.0000718 time=105.84 INFO:root:[step 282499] mlm_loss=1.65939 mlm_acc=62.95657 nsp_loss=0.05997 nsp_acc=97.737 throughput=135.0K tks/s lr=0.0000718 time=134.67 INFO:root:[step 282749] mlm_loss=1.54774 mlm_acc=65.07270 nsp_loss=0.06620 nsp_acc=97.471 throughput=114.0K tks/s lr=0.0000717 time=106.73 INFO:root:[step 282999] mlm_loss=1.81318 mlm_acc=61.99168 nsp_loss=0.07230 nsp_acc=97.217 throughput=143.0K tks/s lr=0.0000717 time=136.17 INFO:root:[step 283249] mlm_loss=1.74332 mlm_acc=63.87764 nsp_loss=0.04637 nsp_acc=98.314 throughput=133.0K tks/s lr=0.0000717 time=121.29 INFO:root:[step 283499] mlm_loss=1.73861 mlm_acc=61.62682 nsp_loss=0.07126 nsp_acc=97.326 throughput=134.0K tks/s lr=0.0000717 time=133.52 INFO:root:[step 283749] mlm_loss=1.59432 mlm_acc=64.82801 nsp_loss=0.05558 nsp_acc=97.972 throughput=116.0K tks/s lr=0.0000716 time=117.08 INFO:root:[step 283999] mlm_loss=1.79470 mlm_acc=61.71342 nsp_loss=0.07246 nsp_acc=97.142 throughput=139.0K tks/s lr=0.0000716 time=126.49 INFO:root:[step 284249] mlm_loss=1.72263 mlm_acc=63.68984 nsp_loss=0.04235 nsp_acc=98.456 throughput=132.0K tks/s lr=0.0000716 time=132.04 INFO:root:[step 284499] mlm_loss=1.78778 mlm_acc=63.38433 nsp_loss=0.04317 nsp_acc=98.469 throughput=134.0K tks/s lr=0.0000716 time=130.17 INFO:root:[step 284749] mlm_loss=1.86466 mlm_acc=62.86407 nsp_loss=0.03938 nsp_acc=98.509 throughput=146.0K tks/s lr=0.0000715 time=141.16 INFO:root:[step 284999] mlm_loss=1.63708 mlm_acc=64.58187 nsp_loss=0.04770 nsp_acc=98.290 throughput=121.0K tks/s lr=0.0000715 time=124.22 INFO:root:[step 284999] Saving checkpoints to /home/ubuntu/ckpt-master/0284999.params, /home/ubuntu/ckpt-master/0284999.states. INFO:root:[step 285249] mlm_loss=1.79457 mlm_acc=63.63413 nsp_loss=0.04125 nsp_acc=98.445 throughput=124.0K tks/s lr=0.0000715 time=144.04 INFO:root:[step 285499] mlm_loss=1.57432 mlm_acc=65.78242 nsp_loss=0.04665 nsp_acc=98.353 throughput=111.0K tks/s lr=0.0000715 time=118.67 INFO:root:[step 285749] mlm_loss=1.56416 mlm_acc=67.87487 nsp_loss=0.05437 nsp_acc=97.987 throughput=138.0K tks/s lr=0.0000714 time=122.17 INFO:root:[step 285999] mlm_loss=1.63847 mlm_acc=65.21082 nsp_loss=0.06075 nsp_acc=97.746 throughput=126.0K tks/s lr=0.0000714 time=123.63 INFO:root:[step 286249] mlm_loss=1.85857 mlm_acc=62.24979 nsp_loss=0.05815 nsp_acc=97.752 throughput=143.0K tks/s lr=0.0000714 time=141.33 INFO:root:[step 286499] mlm_loss=1.91005 mlm_acc=61.42048 nsp_loss=0.06865 nsp_acc=97.303 throughput=138.0K tks/s lr=0.0000714 time=144.47 INFO:root:[step 286749] mlm_loss=1.66006 mlm_acc=64.11928 nsp_loss=0.04558 nsp_acc=98.363 throughput=134.0K tks/s lr=0.0000713 time=114.79 INFO:root:[step 286999] mlm_loss=1.74510 mlm_acc=64.00994 nsp_loss=0.04442 nsp_acc=98.351 throughput=125.0K tks/s lr=0.0000713 time=128.26 INFO:root:[step 287249] mlm_loss=1.61613 mlm_acc=64.85780 nsp_loss=0.05133 nsp_acc=98.167 throughput=128.0K tks/s lr=0.0000713 time=114.75 INFO:root:[step 287499] mlm_loss=1.71502 mlm_acc=62.72219 nsp_loss=0.05680 nsp_acc=97.896 throughput=134.0K tks/s lr=0.0000713 time=131.31 INFO:root:[step 287749] mlm_loss=1.89185 mlm_acc=62.16215 nsp_loss=0.04846 nsp_acc=98.178 throughput=147.0K tks/s lr=0.0000712 time=143.40 INFO:root:[step 287999] mlm_loss=1.73326 mlm_acc=64.17585 nsp_loss=0.04281 nsp_acc=98.441 throughput=130.0K tks/s lr=0.0000712 time=131.94 INFO:root:[step 288249] mlm_loss=1.63022 mlm_acc=65.18736 nsp_loss=0.04603 nsp_acc=98.340 throughput=122.0K tks/s lr=0.0000712 time=108.10 INFO:root:[step 288499] mlm_loss=1.73064 mlm_acc=62.06761 nsp_loss=0.06490 nsp_acc=97.475 throughput=141.0K tks/s lr=0.0000712 time=140.80 INFO:root:[step 288749] mlm_loss=1.69507 mlm_acc=64.31580 nsp_loss=0.04555 nsp_acc=98.355 throughput=127.0K tks/s lr=0.0000711 time=124.92 INFO:root:[step 288999] mlm_loss=1.35313 mlm_acc=71.72538 nsp_loss=0.06380 nsp_acc=97.743 throughput=142.0K tks/s lr=0.0000711 time=126.77 INFO:root:[step 289249] mlm_loss=1.77470 mlm_acc=63.16529 nsp_loss=0.04456 nsp_acc=98.397 throughput=136.0K tks/s lr=0.0000711 time=132.64 INFO:root:[step 289499] mlm_loss=1.78228 mlm_acc=64.34550 nsp_loss=0.04140 nsp_acc=98.516 throughput=145.0K tks/s lr=0.0000711 time=141.60 INFO:root:[step 289749] mlm_loss=1.71834 mlm_acc=64.12120 nsp_loss=0.04255 nsp_acc=98.496 throughput=135.0K tks/s lr=0.0000710 time=131.99 INFO:root:[step 289999] mlm_loss=1.68469 mlm_acc=64.91994 nsp_loss=0.04442 nsp_acc=98.387 throughput=126.0K tks/s lr=0.0000710 time=121.65 INFO:root:[step 289999] Saving checkpoints to /home/ubuntu/ckpt-master/0289999.params, /home/ubuntu/ckpt-master/0289999.states. INFO:root:[step 290249] mlm_loss=1.72483 mlm_acc=64.19655 nsp_loss=0.04098 nsp_acc=98.583 throughput=114.0K tks/s lr=0.0000710 time=147.08 INFO:root:[step 290499] mlm_loss=1.66218 mlm_acc=64.69210 nsp_loss=0.04691 nsp_acc=98.307 throughput=133.0K tks/s lr=0.0000710 time=115.38 INFO:root:[step 290749] mlm_loss=1.78053 mlm_acc=63.84038 nsp_loss=0.04243 nsp_acc=98.455 throughput=133.0K tks/s lr=0.0000709 time=131.79 INFO:root:[step 290999] mlm_loss=1.68233 mlm_acc=64.54770 nsp_loss=0.04541 nsp_acc=98.346 throughput=130.0K tks/s lr=0.0000709 time=112.80 INFO:root:[step 291249] mlm_loss=1.63190 mlm_acc=65.15533 nsp_loss=0.04592 nsp_acc=98.341 throughput=114.0K tks/s lr=0.0000709 time=117.31 INFO:root:[step 291499] mlm_loss=1.63470 mlm_acc=64.90280 nsp_loss=0.04597 nsp_acc=98.361 throughput=134.0K tks/s lr=0.0000709 time=113.41 INFO:root:[step 291749] mlm_loss=1.76040 mlm_acc=63.44255 nsp_loss=0.04198 nsp_acc=98.469 throughput=131.0K tks/s lr=0.0000708 time=133.59 INFO:root:[step 291999] mlm_loss=1.69078 mlm_acc=64.57210 nsp_loss=0.04399 nsp_acc=98.418 throughput=135.0K tks/s lr=0.0000708 time=115.71 INFO:root:[step 292249] mlm_loss=1.67063 mlm_acc=65.00066 nsp_loss=0.04664 nsp_acc=98.245 throughput=123.0K tks/s lr=0.0000708 time=124.92 INFO:root:[step 292499] mlm_loss=1.76703 mlm_acc=63.61503 nsp_loss=0.04254 nsp_acc=98.415 throughput=135.0K tks/s lr=0.0000708 time=132.29 INFO:root:[step 292749] mlm_loss=1.76471 mlm_acc=62.72587 nsp_loss=0.04663 nsp_acc=98.311 throughput=145.0K tks/s lr=0.0000707 time=135.73 INFO:root:[step 292999] mlm_loss=1.79246 mlm_acc=62.82228 nsp_loss=0.04762 nsp_acc=98.208 throughput=138.0K tks/s lr=0.0000707 time=138.62 INFO:root:[step 293249] mlm_loss=1.76955 mlm_acc=64.00498 nsp_loss=0.04372 nsp_acc=98.352 throughput=140.0K tks/s lr=0.0000707 time=120.54 INFO:root:[step 293499] mlm_loss=1.71933 mlm_acc=64.91817 nsp_loss=0.04703 nsp_acc=98.291 throughput=135.0K tks/s lr=0.0000707 time=130.90 INFO:root:[step 293749] mlm_loss=1.62858 mlm_acc=65.45867 nsp_loss=0.04603 nsp_acc=98.378 throughput=117.0K tks/s lr=0.0000706 time=116.09 INFO:root:[step 293999] mlm_loss=1.72803 mlm_acc=63.78693 nsp_loss=0.04652 nsp_acc=98.317 throughput=136.0K tks/s lr=0.0000706 time=125.68 INFO:root:[step 294249] mlm_loss=1.66905 mlm_acc=64.75237 nsp_loss=0.04534 nsp_acc=98.331 throughput=123.0K tks/s lr=0.0000706 time=123.67 INFO:root:[step 294499] mlm_loss=1.64853 mlm_acc=63.69873 nsp_loss=0.09984 nsp_acc=95.949 throughput=135.0K tks/s lr=0.0000706 time=131.65 INFO:root:[step 294749] mlm_loss=1.66438 mlm_acc=64.83813 nsp_loss=0.04211 nsp_acc=98.481 throughput=125.0K tks/s lr=0.0000705 time=115.07 INFO:root:[step 294999] mlm_loss=1.63690 mlm_acc=65.39609 nsp_loss=0.04748 nsp_acc=98.269 throughput=129.0K tks/s lr=0.0000705 time=114.65 INFO:root:[step 294999] Saving checkpoints to /home/ubuntu/ckpt-master/0294999.params, /home/ubuntu/ckpt-master/0294999.states. INFO:root:[step 295249] mlm_loss=1.34375 mlm_acc=67.70956 nsp_loss=0.05510 nsp_acc=98.040 throughput=91.0K tks/s lr=0.0000705 time=115.04 INFO:root:[step 295499] mlm_loss=1.67761 mlm_acc=63.34760 nsp_loss=0.07602 nsp_acc=97.025 throughput=138.0K tks/s lr=0.0000705 time=136.45 INFO:root:[step 295749] mlm_loss=1.87971 mlm_acc=61.32765 nsp_loss=0.08186 nsp_acc=96.799 throughput=146.0K tks/s lr=0.0000704 time=142.83 INFO:root:[step 295999] mlm_loss=1.66162 mlm_acc=64.67379 nsp_loss=0.04623 nsp_acc=98.320 throughput=120.0K tks/s lr=0.0000704 time=121.13 INFO:root:[step 296249] mlm_loss=1.64876 mlm_acc=65.08599 nsp_loss=0.04356 nsp_acc=98.440 throughput=127.0K tks/s lr=0.0000704 time=115.23 INFO:root:[step 296499] mlm_loss=1.71739 mlm_acc=63.26635 nsp_loss=0.04747 nsp_acc=98.247 throughput=131.0K tks/s lr=0.0000704 time=124.87 INFO:root:[step 296749] mlm_loss=1.65985 mlm_acc=62.49183 nsp_loss=0.05153 nsp_acc=98.134 throughput=132.0K tks/s lr=0.0000703 time=123.03 INFO:root:[step 296999] mlm_loss=1.71018 mlm_acc=64.43111 nsp_loss=0.04498 nsp_acc=98.362 throughput=127.0K tks/s lr=0.0000703 time=124.65 INFO:root:[step 297249] mlm_loss=1.75207 mlm_acc=63.64511 nsp_loss=0.04404 nsp_acc=98.399 throughput=133.0K tks/s lr=0.0000703 time=132.14 INFO:root:[step 297499] mlm_loss=1.77152 mlm_acc=61.96562 nsp_loss=0.06571 nsp_acc=97.501 throughput=137.0K tks/s lr=0.0000703 time=140.08 INFO:root:[step 297749] mlm_loss=1.58250 mlm_acc=65.51644 nsp_loss=0.04498 nsp_acc=98.385 throughput=120.0K tks/s lr=0.0000702 time=111.47 INFO:root:[step 297999] mlm_loss=1.56268 mlm_acc=65.81495 nsp_loss=0.04924 nsp_acc=98.243 throughput=119.0K tks/s lr=0.0000702 time=107.00 INFO:root:[step 298249] mlm_loss=1.77939 mlm_acc=63.53841 nsp_loss=0.04100 nsp_acc=98.488 throughput=134.0K tks/s lr=0.0000702 time=132.00 INFO:root:[step 298499] mlm_loss=1.90509 mlm_acc=61.44347 nsp_loss=0.05497 nsp_acc=97.824 throughput=147.0K tks/s lr=0.0000702 time=159.74 INFO:root:[step 298749] mlm_loss=1.72406 mlm_acc=64.47733 nsp_loss=0.04242 nsp_acc=98.445 throughput=139.0K tks/s lr=0.0000701 time=120.97 INFO:root:[step 298999] mlm_loss=1.55393 mlm_acc=65.81935 nsp_loss=0.04728 nsp_acc=98.291 throughput=114.0K tks/s lr=0.0000701 time=119.34 INFO:root:[step 299249] mlm_loss=1.64031 mlm_acc=64.16136 nsp_loss=0.08811 nsp_acc=96.448 throughput=140.0K tks/s lr=0.0000701 time=117.71 INFO:root:[step 299499] mlm_loss=1.89592 mlm_acc=61.19150 nsp_loss=0.11957 nsp_acc=94.945 throughput=153.0K tks/s lr=0.0000701 time=151.93 INFO:root:[step 299749] mlm_loss=1.67929 mlm_acc=64.70599 nsp_loss=0.04618 nsp_acc=98.345 throughput=122.0K tks/s lr=0.0000700 time=123.52 INFO:root:[step 299999] mlm_loss=1.48072 mlm_acc=66.08403 nsp_loss=0.04959 nsp_acc=98.145 throughput=118.0K tks/s lr=0.0000700 time=106.32 INFO:root:[step 299999] Saving checkpoints to /home/ubuntu/ckpt-master/0299999.params, /home/ubuntu/ckpt-master/0299999.states. INFO:root:[step 300249] mlm_loss=1.76968 mlm_acc=62.85816 nsp_loss=0.04264 nsp_acc=98.470 throughput=129.0K tks/s lr=0.0000700 time=155.35 INFO:root:[step 300499] mlm_loss=1.74722 mlm_acc=64.05680 nsp_loss=0.04716 nsp_acc=98.256 throughput=131.0K tks/s lr=0.0000700 time=131.70 INFO:root:[step 300749] mlm_loss=1.47053 mlm_acc=67.32620 nsp_loss=0.05414 nsp_acc=98.122 throughput=122.0K tks/s lr=0.0000699 time=107.69 INFO:root:[step 300999] mlm_loss=1.69948 mlm_acc=64.54426 nsp_loss=0.05026 nsp_acc=98.167 throughput=128.0K tks/s lr=0.0000699 time=127.74 INFO:root:[step 301249] mlm_loss=1.75156 mlm_acc=61.65587 nsp_loss=0.06383 nsp_acc=97.627 throughput=137.0K tks/s lr=0.0000699 time=137.11 INFO:root:[step 301499] mlm_loss=1.69768 mlm_acc=63.65296 nsp_loss=0.09529 nsp_acc=96.155 throughput=131.0K tks/s lr=0.0000699 time=135.18 INFO:root:[step 301749] mlm_loss=1.49978 mlm_acc=66.24351 nsp_loss=0.05248 nsp_acc=98.102 throughput=115.0K tks/s lr=0.0000698 time=106.80 INFO:root:[step 301999] mlm_loss=1.80511 mlm_acc=61.45304 nsp_loss=0.07038 nsp_acc=97.265 throughput=144.0K tks/s lr=0.0000698 time=137.54 INFO:root:[step 302249] mlm_loss=1.74601 mlm_acc=61.86429 nsp_loss=0.08284 nsp_acc=96.766 throughput=150.0K tks/s lr=0.0000698 time=156.61 INFO:root:[step 302499] mlm_loss=1.55053 mlm_acc=65.42550 nsp_loss=0.05210 nsp_acc=98.115 throughput=133.0K tks/s lr=0.0000698 time=113.86 INFO:root:[step 302749] mlm_loss=1.75915 mlm_acc=62.43907 nsp_loss=0.05255 nsp_acc=97.972 throughput=134.0K tks/s lr=0.0000697 time=130.06 INFO:root:[step 302999] mlm_loss=1.86374 mlm_acc=62.47334 nsp_loss=0.04586 nsp_acc=98.285 throughput=141.0K tks/s lr=0.0000697 time=141.31 INFO:root:[step 303249] mlm_loss=1.66328 mlm_acc=64.90312 nsp_loss=0.04434 nsp_acc=98.404 throughput=118.0K tks/s lr=0.0000697 time=121.57 INFO:root:[step 303499] mlm_loss=1.69098 mlm_acc=64.71076 nsp_loss=0.04498 nsp_acc=98.393 throughput=139.0K tks/s lr=0.0000697 time=116.88 INFO:root:[step 303749] mlm_loss=1.83469 mlm_acc=62.44942 nsp_loss=0.07385 nsp_acc=97.001 throughput=150.0K tks/s lr=0.0000696 time=145.71 INFO:root:[step 303999] mlm_loss=1.63192 mlm_acc=64.98515 nsp_loss=0.04814 nsp_acc=98.300 throughput=117.0K tks/s lr=0.0000696 time=120.94 INFO:root:[step 304249] mlm_loss=1.74245 mlm_acc=62.39202 nsp_loss=0.06955 nsp_acc=97.344 throughput=147.0K tks/s lr=0.0000696 time=141.01 INFO:root:[step 304499] mlm_loss=1.38263 mlm_acc=69.70339 nsp_loss=0.08239 nsp_acc=96.954 throughput=155.0K tks/s lr=0.0000696 time=156.61 INFO:root:[step 304749] mlm_loss=1.89007 mlm_acc=60.71381 nsp_loss=0.05760 nsp_acc=97.819 throughput=145.0K tks/s lr=0.0000695 time=146.71 INFO:root:[step 304999] mlm_loss=1.66389 mlm_acc=64.92096 nsp_loss=0.04649 nsp_acc=98.299 throughput=123.0K tks/s lr=0.0000695 time=123.51 INFO:root:[step 304999] Saving checkpoints to /home/ubuntu/ckpt-master/0304999.params, /home/ubuntu/ckpt-master/0304999.states. INFO:root:[step 305249] mlm_loss=1.66365 mlm_acc=62.67643 nsp_loss=0.05949 nsp_acc=97.739 throughput=124.0K tks/s lr=0.0000695 time=156.42 INFO:root:[step 305499] mlm_loss=1.68335 mlm_acc=63.31458 nsp_loss=0.06095 nsp_acc=97.651 throughput=139.0K tks/s lr=0.0000695 time=119.91 INFO:root:[step 305749] mlm_loss=1.66613 mlm_acc=63.86462 nsp_loss=0.05543 nsp_acc=97.950 throughput=123.0K tks/s lr=0.0000694 time=124.73 INFO:root:[step 305999] mlm_loss=1.80780 mlm_acc=62.55752 nsp_loss=0.06986 nsp_acc=97.176 throughput=145.0K tks/s lr=0.0000694 time=146.24 INFO:root:[step 306249] mlm_loss=1.53286 mlm_acc=66.03132 nsp_loss=0.04212 nsp_acc=98.464 throughput=121.0K tks/s lr=0.0000694 time=107.28 INFO:root:[step 306499] mlm_loss=1.40262 mlm_acc=67.07009 nsp_loss=0.03657 nsp_acc=98.728 throughput=118.0K tks/s lr=0.0000694 time=107.46 INFO:root:[step 306749] mlm_loss=1.59309 mlm_acc=65.47435 nsp_loss=0.04027 nsp_acc=98.552 throughput=121.0K tks/s lr=0.0000693 time=121.07 INFO:root:[step 306999] mlm_loss=1.66707 mlm_acc=64.55298 nsp_loss=0.03517 nsp_acc=98.700 throughput=136.0K tks/s lr=0.0000693 time=116.00 INFO:root:[step 307249] mlm_loss=1.58413 mlm_acc=64.90246 nsp_loss=0.06086 nsp_acc=97.571 throughput=123.0K tks/s lr=0.0000693 time=120.95 INFO:root:[step 307499] mlm_loss=1.90064 mlm_acc=61.34136 nsp_loss=0.08128 nsp_acc=96.701 throughput=148.0K tks/s lr=0.0000693 time=145.31 INFO:root:[step 307749] mlm_loss=1.77644 mlm_acc=60.67633 nsp_loss=0.06624 nsp_acc=97.414 throughput=143.0K tks/s lr=0.0000692 time=150.48 INFO:root:[step 307999] mlm_loss=1.68524 mlm_acc=62.00897 nsp_loss=0.09128 nsp_acc=96.360 throughput=151.0K tks/s lr=0.0000692 time=149.36 INFO:root:[step 308249] mlm_loss=1.63304 mlm_acc=63.55302 nsp_loss=0.05190 nsp_acc=98.030 throughput=132.0K tks/s lr=0.0000692 time=129.87 INFO:root:[step 308499] mlm_loss=1.93268 mlm_acc=60.91991 nsp_loss=0.09764 nsp_acc=95.968 throughput=149.0K tks/s lr=0.0000692 time=149.34 INFO:root:[step 308749] mlm_loss=1.89534 mlm_acc=60.92799 nsp_loss=0.07119 nsp_acc=97.098 throughput=156.0K tks/s lr=0.0000691 time=155.77 INFO:root:[step 308999] mlm_loss=1.81910 mlm_acc=62.54784 nsp_loss=0.06093 nsp_acc=97.542 throughput=150.0K tks/s lr=0.0000691 time=148.60 INFO:root:[step 309249] mlm_loss=1.43546 mlm_acc=70.30403 nsp_loss=0.05438 nsp_acc=98.106 throughput=144.0K tks/s lr=0.0000691 time=142.67 INFO:root:[step 309499] mlm_loss=1.69448 mlm_acc=63.27854 nsp_loss=0.05549 nsp_acc=97.823 throughput=137.0K tks/s lr=0.0000691 time=139.92 INFO:root:[step 309749] mlm_loss=1.57662 mlm_acc=65.43122 nsp_loss=0.03851 nsp_acc=98.633 throughput=119.0K tks/s lr=0.0000690 time=120.64 INFO:root:[step 309999] mlm_loss=1.68914 mlm_acc=64.77781 nsp_loss=0.04127 nsp_acc=98.480 throughput=134.0K tks/s lr=0.0000690 time=114.93 INFO:root:[step 309999] Saving checkpoints to /home/ubuntu/ckpt-master/0309999.params, /home/ubuntu/ckpt-master/0309999.states. INFO:root:[step 310249] mlm_loss=1.65812 mlm_acc=64.81418 nsp_loss=0.03814 nsp_acc=98.654 throughput=111.0K tks/s lr=0.0000690 time=135.82 INFO:root:[step 310499] mlm_loss=1.69860 mlm_acc=64.57522 nsp_loss=0.03672 nsp_acc=98.665 throughput=135.0K tks/s lr=0.0000690 time=120.01 INFO:root:[step 310749] mlm_loss=1.68055 mlm_acc=64.07306 nsp_loss=0.03757 nsp_acc=98.660 throughput=131.0K tks/s lr=0.0000689 time=131.98 INFO:root:[step 310999] mlm_loss=1.75637 mlm_acc=62.46883 nsp_loss=0.06510 nsp_acc=97.474 throughput=146.0K tks/s lr=0.0000689 time=140.47 INFO:root:[step 311249] mlm_loss=1.84793 mlm_acc=62.27014 nsp_loss=0.07364 nsp_acc=96.947 throughput=149.0K tks/s lr=0.0000689 time=146.35 INFO:root:[step 311499] mlm_loss=2.02996 mlm_acc=59.98002 nsp_loss=0.07575 nsp_acc=96.945 throughput=139.0K tks/s lr=0.0000689 time=136.95 INFO:root:[step 311749] mlm_loss=1.88396 mlm_acc=61.64879 nsp_loss=0.04636 nsp_acc=98.278 throughput=153.0K tks/s lr=0.0000688 time=162.95 INFO:root:[step 311999] mlm_loss=1.61902 mlm_acc=64.41563 nsp_loss=0.05383 nsp_acc=98.022 throughput=141.0K tks/s lr=0.0000688 time=132.43 INFO:root:[step 312249] mlm_loss=1.67550 mlm_acc=64.69324 nsp_loss=0.03631 nsp_acc=98.717 throughput=128.0K tks/s lr=0.0000688 time=126.91 INFO:root:[step 312499] mlm_loss=1.55583 mlm_acc=65.91211 nsp_loss=0.04337 nsp_acc=98.476 throughput=120.0K tks/s lr=0.0000688 time=110.92 INFO:root:[step 312749] mlm_loss=1.53545 mlm_acc=65.83416 nsp_loss=0.04816 nsp_acc=98.268 throughput=114.0K tks/s lr=0.0000687 time=116.09 INFO:root:[step 312999] mlm_loss=1.80694 mlm_acc=62.79007 nsp_loss=0.06937 nsp_acc=97.242 throughput=148.0K tks/s lr=0.0000687 time=147.12 INFO:root:[step 313249] mlm_loss=1.71195 mlm_acc=64.81813 nsp_loss=0.03619 nsp_acc=98.740 throughput=131.0K tks/s lr=0.0000687 time=131.98 INFO:root:[step 313499] mlm_loss=1.60050 mlm_acc=65.02256 nsp_loss=0.03593 nsp_acc=98.678 throughput=131.0K tks/s lr=0.0000687 time=113.68 INFO:root:[step 313749] mlm_loss=1.67825 mlm_acc=64.39099 nsp_loss=0.04195 nsp_acc=98.467 throughput=134.0K tks/s lr=0.0000686 time=128.08 INFO:root:[step 313999] mlm_loss=1.66688 mlm_acc=63.78776 nsp_loss=0.05636 nsp_acc=97.900 throughput=130.0K tks/s lr=0.0000686 time=141.00 INFO:root:[step 314249] mlm_loss=1.36053 mlm_acc=66.39418 nsp_loss=0.05369 nsp_acc=98.088 throughput=115.0K tks/s lr=0.0000686 time=101.30 INFO:root:[step 314499] mlm_loss=1.80702 mlm_acc=62.36255 nsp_loss=0.04037 nsp_acc=98.473 throughput=141.0K tks/s lr=0.0000686 time=145.77 INFO:root:[step 314749] mlm_loss=1.56090 mlm_acc=65.94946 nsp_loss=0.04259 nsp_acc=98.473 throughput=121.0K tks/s lr=0.0000685 time=108.76 INFO:root:[step 314999] mlm_loss=1.52749 mlm_acc=66.30794 nsp_loss=0.04304 nsp_acc=98.468 throughput=121.0K tks/s lr=0.0000685 time=108.67 INFO:root:[step 314999] Saving checkpoints to /home/ubuntu/ckpt-master/0314999.params, /home/ubuntu/ckpt-master/0314999.states. INFO:root:[step 315249] mlm_loss=1.68989 mlm_acc=64.08559 nsp_loss=0.03842 nsp_acc=98.601 throughput=120.0K tks/s lr=0.0000685 time=146.25 INFO:root:[step 315499] mlm_loss=1.86145 mlm_acc=60.81255 nsp_loss=0.07803 nsp_acc=96.950 throughput=154.0K tks/s lr=0.0000685 time=157.49 INFO:root:[step 315749] mlm_loss=1.71731 mlm_acc=64.00229 nsp_loss=0.04238 nsp_acc=98.453 throughput=132.0K tks/s lr=0.0000684 time=129.90 INFO:root:[step 315999] mlm_loss=1.67129 mlm_acc=64.72571 nsp_loss=0.04033 nsp_acc=98.568 throughput=123.0K tks/s lr=0.0000684 time=126.41 INFO:root:[step 316249] mlm_loss=1.68235 mlm_acc=63.93042 nsp_loss=0.03406 nsp_acc=98.740 throughput=134.0K tks/s lr=0.0000684 time=130.29 INFO:root:[step 316499] mlm_loss=1.56872 mlm_acc=65.58087 nsp_loss=0.04097 nsp_acc=98.546 throughput=122.0K tks/s lr=0.0000684 time=110.10 INFO:root:[step 316749] mlm_loss=1.70666 mlm_acc=64.48576 nsp_loss=0.03810 nsp_acc=98.670 throughput=129.0K tks/s lr=0.0000683 time=126.84 INFO:root:[step 316999] mlm_loss=1.64133 mlm_acc=65.20268 nsp_loss=0.04394 nsp_acc=98.410 throughput=125.0K tks/s lr=0.0000683 time=112.63 INFO:root:[step 317249] mlm_loss=1.71815 mlm_acc=63.98436 nsp_loss=0.04760 nsp_acc=98.217 throughput=141.0K tks/s lr=0.0000683 time=134.48 INFO:root:[step 317499] mlm_loss=1.75944 mlm_acc=63.49772 nsp_loss=0.05109 nsp_acc=98.064 throughput=141.0K tks/s lr=0.0000683 time=142.49 INFO:root:[step 317749] mlm_loss=1.73359 mlm_acc=64.05639 nsp_loss=0.03476 nsp_acc=98.734 throughput=138.0K tks/s lr=0.0000682 time=133.28 INFO:root:[step 317999] mlm_loss=1.72715 mlm_acc=64.43199 nsp_loss=0.03651 nsp_acc=98.666 throughput=137.0K tks/s lr=0.0000682 time=119.27 INFO:root:[step 318249] mlm_loss=1.73169 mlm_acc=63.15227 nsp_loss=0.07843 nsp_acc=96.909 throughput=136.0K tks/s lr=0.0000682 time=135.11 INFO:root:[step 318499] mlm_loss=1.76825 mlm_acc=62.66306 nsp_loss=0.07512 nsp_acc=96.969 throughput=146.0K tks/s lr=0.0000682 time=148.92 INFO:root:[step 318749] mlm_loss=1.78012 mlm_acc=61.96981 nsp_loss=0.05436 nsp_acc=97.958 throughput=143.0K tks/s lr=0.0000681 time=145.21 INFO:root:[step 318999] mlm_loss=1.61651 mlm_acc=65.34257 nsp_loss=0.03885 nsp_acc=98.612 throughput=118.0K tks/s lr=0.0000681 time=120.43 INFO:root:[step 319249] mlm_loss=1.66514 mlm_acc=64.69141 nsp_loss=0.03882 nsp_acc=98.632 throughput=140.0K tks/s lr=0.0000681 time=120.24 INFO:root:[step 319499] mlm_loss=1.56269 mlm_acc=65.84235 nsp_loss=0.04112 nsp_acc=98.524 throughput=118.0K tks/s lr=0.0000681 time=120.23 INFO:root:[step 319749] mlm_loss=1.57827 mlm_acc=65.69986 nsp_loss=0.04620 nsp_acc=98.284 throughput=122.0K tks/s lr=0.0000680 time=110.22 INFO:root:[step 319999] mlm_loss=1.65803 mlm_acc=64.38208 nsp_loss=0.04006 nsp_acc=98.534 throughput=130.0K tks/s lr=0.0000680 time=129.88 INFO:root:[step 319999] Saving checkpoints to /home/ubuntu/ckpt-master/0319999.params, /home/ubuntu/ckpt-master/0319999.states. INFO:root:[step 320249] mlm_loss=1.67200 mlm_acc=64.58018 nsp_loss=0.03908 nsp_acc=98.615 throughput=116.0K tks/s lr=0.0000680 time=142.56 INFO:root:[step 320499] mlm_loss=1.74042 mlm_acc=64.05241 nsp_loss=0.03325 nsp_acc=98.761 throughput=141.0K tks/s lr=0.0000680 time=136.15 INFO:root:[step 320749] mlm_loss=1.81365 mlm_acc=63.51969 nsp_loss=0.03603 nsp_acc=98.673 throughput=142.0K tks/s lr=0.0000679 time=142.11 INFO:root:[step 320999] mlm_loss=1.69254 mlm_acc=64.31616 nsp_loss=0.04388 nsp_acc=98.417 throughput=138.0K tks/s lr=0.0000679 time=120.25 INFO:root:[step 321249] mlm_loss=1.88136 mlm_acc=61.66951 nsp_loss=0.05620 nsp_acc=97.796 throughput=147.0K tks/s lr=0.0000679 time=144.00 INFO:root:[step 321499] mlm_loss=1.66080 mlm_acc=62.48189 nsp_loss=0.07728 nsp_acc=96.985 throughput=135.0K tks/s lr=0.0000679 time=137.61 INFO:root:[step 321749] mlm_loss=1.75400 mlm_acc=61.80068 nsp_loss=0.09656 nsp_acc=96.024 throughput=153.0K tks/s lr=0.0000678 time=151.94 INFO:root:[step 321999] mlm_loss=1.69989 mlm_acc=64.30964 nsp_loss=0.04135 nsp_acc=98.501 throughput=134.0K tks/s lr=0.0000678 time=131.71 INFO:root:[step 322249] mlm_loss=1.68981 mlm_acc=63.31642 nsp_loss=0.04022 nsp_acc=98.562 throughput=133.0K tks/s lr=0.0000678 time=127.80 INFO:root:[step 322499] mlm_loss=1.79965 mlm_acc=62.29952 nsp_loss=0.07240 nsp_acc=97.002 throughput=142.0K tks/s lr=0.0000678 time=142.81 INFO:root:[step 322749] mlm_loss=1.58438 mlm_acc=64.73647 nsp_loss=0.07655 nsp_acc=96.952 throughput=130.0K tks/s lr=0.0000677 time=116.09 INFO:root:[step 322999] mlm_loss=2.00711 mlm_acc=59.85538 nsp_loss=0.08820 nsp_acc=96.335 throughput=145.0K tks/s lr=0.0000677 time=157.63 INFO:root:[step 323249] mlm_loss=1.76643 mlm_acc=62.13979 nsp_loss=0.06698 nsp_acc=97.441 throughput=148.0K tks/s lr=0.0000677 time=151.90 INFO:root:[step 323499] mlm_loss=1.54755 mlm_acc=65.99965 nsp_loss=0.04476 nsp_acc=98.389 throughput=122.0K tks/s lr=0.0000677 time=108.73 INFO:root:[step 323749] mlm_loss=1.54556 mlm_acc=66.03434 nsp_loss=0.04500 nsp_acc=98.433 throughput=113.0K tks/s lr=0.0000676 time=117.95 INFO:root:[step 323999] mlm_loss=1.65259 mlm_acc=64.60813 nsp_loss=0.03809 nsp_acc=98.654 throughput=138.0K tks/s lr=0.0000676 time=119.37 INFO:root:[step 324249] mlm_loss=1.52708 mlm_acc=65.92197 nsp_loss=0.04098 nsp_acc=98.521 throughput=112.0K tks/s lr=0.0000676 time=117.63 INFO:root:[step 324499] mlm_loss=1.64385 mlm_acc=65.16832 nsp_loss=0.04323 nsp_acc=98.445 throughput=124.0K tks/s lr=0.0000676 time=112.11 INFO:root:[step 324749] mlm_loss=1.61959 mlm_acc=65.30898 nsp_loss=0.04215 nsp_acc=98.463 throughput=127.0K tks/s lr=0.0000675 time=111.49 INFO:root:[step 324999] mlm_loss=1.62183 mlm_acc=65.35591 nsp_loss=0.04290 nsp_acc=98.392 throughput=114.0K tks/s lr=0.0000675 time=117.49 INFO:root:[step 324999] Saving checkpoints to /home/ubuntu/ckpt-master/0324999.params, /home/ubuntu/ckpt-master/0324999.states. INFO:root:[step 325249] mlm_loss=1.72682 mlm_acc=64.04809 nsp_loss=0.03981 nsp_acc=98.515 throughput=128.0K tks/s lr=0.0000675 time=136.58 INFO:root:[step 325499] mlm_loss=1.53223 mlm_acc=65.99134 nsp_loss=0.04335 nsp_acc=98.488 throughput=113.0K tks/s lr=0.0000675 time=117.43 INFO:root:[step 325749] mlm_loss=1.81707 mlm_acc=61.27733 nsp_loss=0.07523 nsp_acc=97.058 throughput=141.0K tks/s lr=0.0000674 time=132.84 INFO:root:[step 325999] mlm_loss=1.82158 mlm_acc=62.35900 nsp_loss=0.05787 nsp_acc=97.753 throughput=139.0K tks/s lr=0.0000674 time=142.70 INFO:root:[step 326249] mlm_loss=1.60006 mlm_acc=65.10726 nsp_loss=0.04036 nsp_acc=98.552 throughput=132.0K tks/s lr=0.0000674 time=117.33 INFO:root:[step 326499] mlm_loss=1.69717 mlm_acc=64.73789 nsp_loss=0.04028 nsp_acc=98.487 throughput=132.0K tks/s lr=0.0000674 time=127.95 INFO:root:[step 326749] mlm_loss=1.70459 mlm_acc=64.93148 nsp_loss=0.04900 nsp_acc=98.239 throughput=149.0K tks/s lr=0.0000673 time=143.62 INFO:root:[step 326999] mlm_loss=1.75052 mlm_acc=61.97964 nsp_loss=0.06482 nsp_acc=97.540 throughput=145.0K tks/s lr=0.0000673 time=149.61 INFO:root:[step 327249] mlm_loss=1.80950 mlm_acc=61.65407 nsp_loss=0.07705 nsp_acc=97.023 throughput=146.0K tks/s lr=0.0000673 time=142.50 INFO:root:[step 327499] mlm_loss=1.82429 mlm_acc=61.63677 nsp_loss=0.06215 nsp_acc=97.615 throughput=146.0K tks/s lr=0.0000673 time=147.96 INFO:root:[step 327749] mlm_loss=1.68048 mlm_acc=64.66467 nsp_loss=0.04754 nsp_acc=98.240 throughput=132.0K tks/s lr=0.0000672 time=125.85 INFO:root:[step 327999] mlm_loss=1.88354 mlm_acc=62.12940 nsp_loss=0.04326 nsp_acc=98.310 throughput=152.0K tks/s lr=0.0000672 time=154.13 INFO:root:[step 328249] mlm_loss=1.94211 mlm_acc=61.14198 nsp_loss=0.07826 nsp_acc=96.837 throughput=149.0K tks/s lr=0.0000672 time=148.51 INFO:root:[step 328499] mlm_loss=1.69159 mlm_acc=64.48875 nsp_loss=0.04393 nsp_acc=98.389 throughput=128.0K tks/s lr=0.0000672 time=127.72 INFO:root:[step 328749] mlm_loss=1.65074 mlm_acc=64.93152 nsp_loss=0.04036 nsp_acc=98.626 throughput=128.0K tks/s lr=0.0000671 time=125.28 INFO:root:[step 328999] mlm_loss=1.55138 mlm_acc=66.35312 nsp_loss=0.04082 nsp_acc=98.574 throughput=125.0K tks/s lr=0.0000671 time=113.22 INFO:root:[step 329249] mlm_loss=1.66907 mlm_acc=64.26978 nsp_loss=0.12851 nsp_acc=94.655 throughput=132.0K tks/s lr=0.0000671 time=128.85 INFO:root:[step 329499] mlm_loss=1.28333 mlm_acc=72.51199 nsp_loss=0.06044 nsp_acc=97.859 throughput=137.0K tks/s lr=0.0000671 time=125.26 INFO:root:[step 329749] mlm_loss=1.53523 mlm_acc=65.87930 nsp_loss=0.05702 nsp_acc=97.866 throughput=114.0K tks/s lr=0.0000670 time=108.12 INFO:root:[step 329999] mlm_loss=1.83212 mlm_acc=62.31863 nsp_loss=0.04346 nsp_acc=98.346 throughput=147.0K tks/s lr=0.0000670 time=160.97 INFO:root:[step 329999] Saving checkpoints to /home/ubuntu/ckpt-master/0329999.params, /home/ubuntu/ckpt-master/0329999.states. INFO:root:[step 330249] mlm_loss=1.71304 mlm_acc=63.84160 nsp_loss=0.08584 nsp_acc=96.487 throughput=126.0K tks/s lr=0.0000670 time=156.91 INFO:root:[step 330499] mlm_loss=1.48743 mlm_acc=66.45436 nsp_loss=0.04578 nsp_acc=98.332 throughput=116.0K tks/s lr=0.0000670 time=106.84 INFO:root:[step 330749] mlm_loss=1.56240 mlm_acc=65.74387 nsp_loss=0.04276 nsp_acc=98.430 throughput=127.0K tks/s lr=0.0000669 time=109.94 INFO:root:[step 330999] mlm_loss=1.53952 mlm_acc=66.17163 nsp_loss=0.04468 nsp_acc=98.385 throughput=109.0K tks/s lr=0.0000669 time=114.18 INFO:root:[step 331249] mlm_loss=1.61977 mlm_acc=65.17035 nsp_loss=0.03693 nsp_acc=98.696 throughput=133.0K tks/s lr=0.0000669 time=115.92 INFO:root:[step 331499] mlm_loss=1.76291 mlm_acc=64.04842 nsp_loss=0.03974 nsp_acc=98.600 throughput=136.0K tks/s lr=0.0000669 time=133.45 INFO:root:[step 331749] mlm_loss=1.79169 mlm_acc=61.58441 nsp_loss=0.06452 nsp_acc=97.497 throughput=137.0K tks/s lr=0.0000668 time=136.29 INFO:root:[step 331999] mlm_loss=1.70315 mlm_acc=62.67366 nsp_loss=0.07619 nsp_acc=97.008 throughput=134.0K tks/s lr=0.0000668 time=115.12 INFO:root:[step 332249] mlm_loss=1.72971 mlm_acc=63.86201 nsp_loss=0.04817 nsp_acc=98.216 throughput=128.0K tks/s lr=0.0000668 time=126.34 INFO:root:[step 332499] mlm_loss=1.82605 mlm_acc=62.77555 nsp_loss=0.08290 nsp_acc=96.581 throughput=153.0K tks/s lr=0.0000668 time=151.98 INFO:root:[step 332749] mlm_loss=1.80040 mlm_acc=62.64018 nsp_loss=0.04917 nsp_acc=98.149 throughput=140.0K tks/s lr=0.0000667 time=135.07 INFO:root:[step 332999] mlm_loss=1.73768 mlm_acc=62.99786 nsp_loss=0.04464 nsp_acc=98.358 throughput=139.0K tks/s lr=0.0000667 time=140.58 INFO:root:[step 333249] mlm_loss=1.65394 mlm_acc=64.32869 nsp_loss=0.04119 nsp_acc=98.449 throughput=131.0K tks/s lr=0.0000667 time=127.54 INFO:root:[step 333499] mlm_loss=1.72536 mlm_acc=63.03158 nsp_loss=0.07292 nsp_acc=97.044 throughput=144.0K tks/s lr=0.0000667 time=135.53 INFO:root:[step 333749] mlm_loss=1.73773 mlm_acc=62.87597 nsp_loss=0.07425 nsp_acc=97.096 throughput=146.0K tks/s lr=0.0000666 time=132.01 INFO:root:[step 333999] mlm_loss=1.48259 mlm_acc=66.10267 nsp_loss=0.04783 nsp_acc=98.240 throughput=107.0K tks/s lr=0.0000666 time=116.06 INFO:root:[step 334249] mlm_loss=1.54938 mlm_acc=64.99418 nsp_loss=0.10129 nsp_acc=95.868 throughput=132.0K tks/s lr=0.0000666 time=118.88 INFO:root:[step 334499] mlm_loss=1.71242 mlm_acc=63.53609 nsp_loss=0.07942 nsp_acc=96.742 throughput=132.0K tks/s lr=0.0000666 time=129.61 INFO:root:[step 334749] mlm_loss=1.84214 mlm_acc=62.25120 nsp_loss=0.08313 nsp_acc=96.461 throughput=152.0K tks/s lr=0.0000665 time=153.15 INFO:root:[step 334999] mlm_loss=1.77760 mlm_acc=62.79551 nsp_loss=0.06771 nsp_acc=97.156 throughput=146.0K tks/s lr=0.0000665 time=143.49 INFO:root:[step 334999] Saving checkpoints to /home/ubuntu/ckpt-master/0334999.params, /home/ubuntu/ckpt-master/0334999.states. INFO:root:[step 335249] mlm_loss=1.58155 mlm_acc=64.62352 nsp_loss=0.04904 nsp_acc=98.288 throughput=108.0K tks/s lr=0.0000665 time=143.53 INFO:root:[step 335499] mlm_loss=1.57515 mlm_acc=65.66399 nsp_loss=0.04330 nsp_acc=98.445 throughput=123.0K tks/s lr=0.0000665 time=111.21 INFO:root:[step 335749] mlm_loss=1.63080 mlm_acc=64.19982 nsp_loss=0.06087 nsp_acc=97.757 throughput=141.0K tks/s lr=0.0000664 time=138.45 INFO:root:[step 335999] mlm_loss=1.65261 mlm_acc=63.50903 nsp_loss=0.09624 nsp_acc=96.021 throughput=135.0K tks/s lr=0.0000664 time=131.63 INFO:root:[step 336249] mlm_loss=1.54817 mlm_acc=66.28587 nsp_loss=0.04331 nsp_acc=98.403 throughput=123.0K tks/s lr=0.0000664 time=108.14 INFO:root:[step 336499] mlm_loss=1.50772 mlm_acc=66.50523 nsp_loss=0.04315 nsp_acc=98.439 throughput=121.0K tks/s lr=0.0000664 time=109.37 INFO:root:[step 336749] mlm_loss=1.78067 mlm_acc=62.85672 nsp_loss=0.05450 nsp_acc=97.886 throughput=149.0K tks/s lr=0.0000663 time=146.41 INFO:root:[step 336999] mlm_loss=1.69770 mlm_acc=63.95180 nsp_loss=0.04298 nsp_acc=98.398 throughput=134.0K tks/s lr=0.0000663 time=130.59 INFO:root:[step 337249] mlm_loss=1.77847 mlm_acc=62.12180 nsp_loss=0.06756 nsp_acc=97.385 throughput=152.0K tks/s lr=0.0000663 time=167.83 INFO:root:[step 337499] mlm_loss=1.77093 mlm_acc=63.74027 nsp_loss=0.03230 nsp_acc=98.800 throughput=139.0K tks/s lr=0.0000663 time=138.65 INFO:root:[step 337749] mlm_loss=1.54996 mlm_acc=66.12691 nsp_loss=0.04746 nsp_acc=98.241 throughput=119.0K tks/s lr=0.0000662 time=105.14 INFO:root:[step 337999] mlm_loss=1.72683 mlm_acc=64.43713 nsp_loss=0.04173 nsp_acc=98.486 throughput=137.0K tks/s lr=0.0000662 time=128.30 INFO:root:[step 338249] mlm_loss=1.80835 mlm_acc=63.27407 nsp_loss=0.03653 nsp_acc=98.645 throughput=142.0K tks/s lr=0.0000662 time=144.22 INFO:root:[step 338499] mlm_loss=1.66711 mlm_acc=65.07838 nsp_loss=0.04023 nsp_acc=98.560 throughput=135.0K tks/s lr=0.0000662 time=117.56 INFO:root:[step 338749] mlm_loss=1.57561 mlm_acc=65.89952 nsp_loss=0.03975 nsp_acc=98.628 throughput=121.0K tks/s lr=0.0000661 time=116.95 INFO:root:[step 338999] mlm_loss=1.78576 mlm_acc=63.91406 nsp_loss=0.03703 nsp_acc=98.639 throughput=139.0K tks/s lr=0.0000661 time=135.22 INFO:root:[step 339249] mlm_loss=1.72551 mlm_acc=65.20179 nsp_loss=0.03618 nsp_acc=98.698 throughput=145.0K tks/s lr=0.0000661 time=144.24 INFO:root:[step 339499] mlm_loss=1.65534 mlm_acc=65.14795 nsp_loss=0.03990 nsp_acc=98.573 throughput=131.0K tks/s lr=0.0000661 time=117.02 INFO:root:[step 339749] mlm_loss=1.69769 mlm_acc=64.72185 nsp_loss=0.03923 nsp_acc=98.628 throughput=129.0K tks/s lr=0.0000660 time=125.94 INFO:root:[step 339999] mlm_loss=1.53920 mlm_acc=66.06434 nsp_loss=0.05818 nsp_acc=97.892 throughput=133.0K tks/s lr=0.0000660 time=117.74 INFO:root:[step 339999] Saving checkpoints to /home/ubuntu/ckpt-master/0339999.params, /home/ubuntu/ckpt-master/0339999.states. INFO:root:[step 340249] mlm_loss=1.53459 mlm_acc=65.34642 nsp_loss=0.06217 nsp_acc=97.664 throughput=112.0K tks/s lr=0.0000660 time=137.16 INFO:root:[step 340499] mlm_loss=1.68274 mlm_acc=63.85367 nsp_loss=0.06622 nsp_acc=97.464 throughput=139.0K tks/s lr=0.0000660 time=141.91 INFO:root:[step 340749] mlm_loss=1.53011 mlm_acc=65.35722 nsp_loss=0.05097 nsp_acc=98.236 throughput=132.0K tks/s lr=0.0000659 time=116.09 INFO:root:[step 340999] mlm_loss=1.80555 mlm_acc=62.76869 nsp_loss=0.07310 nsp_acc=97.090 throughput=146.0K tks/s lr=0.0000659 time=163.99 INFO:root:[step 341249] mlm_loss=1.60187 mlm_acc=65.69012 nsp_loss=0.03935 nsp_acc=98.638 throughput=129.0K tks/s lr=0.0000659 time=113.25 INFO:root:[step 341499] mlm_loss=1.98632 mlm_acc=60.67559 nsp_loss=0.08847 nsp_acc=96.425 throughput=154.0K tks/s lr=0.0000659 time=153.67 INFO:root:[step 341749] mlm_loss=1.58130 mlm_acc=65.22324 nsp_loss=0.04801 nsp_acc=98.235 throughput=121.0K tks/s lr=0.0000658 time=122.11 INFO:root:[step 341999] mlm_loss=1.70602 mlm_acc=64.24373 nsp_loss=0.04045 nsp_acc=98.497 throughput=133.0K tks/s lr=0.0000658 time=133.20 INFO:root:[step 342249] mlm_loss=1.34030 mlm_acc=67.78572 nsp_loss=0.04849 nsp_acc=98.241 throughput=109.0K tks/s lr=0.0000658 time=101.13 INFO:root:[step 342499] mlm_loss=1.56174 mlm_acc=65.75525 nsp_loss=0.04495 nsp_acc=98.340 throughput=124.0K tks/s lr=0.0000658 time=111.10 INFO:root:[step 342749] mlm_loss=1.78716 mlm_acc=62.46694 nsp_loss=0.06021 nsp_acc=97.600 throughput=144.0K tks/s lr=0.0000657 time=140.41 INFO:root:[step 342999] mlm_loss=1.73816 mlm_acc=64.65179 nsp_loss=0.03832 nsp_acc=98.589 throughput=136.0K tks/s lr=0.0000657 time=130.39 INFO:root:[step 343249] mlm_loss=1.65431 mlm_acc=64.92883 nsp_loss=0.04292 nsp_acc=98.463 throughput=130.0K tks/s lr=0.0000657 time=117.10 INFO:root:[step 343499] mlm_loss=1.36051 mlm_acc=69.58267 nsp_loss=0.10241 nsp_acc=96.044 throughput=146.0K tks/s lr=0.0000657 time=164.23 INFO:root:[step 343749] mlm_loss=1.67380 mlm_acc=64.61483 nsp_loss=0.03994 nsp_acc=98.503 throughput=139.0K tks/s lr=0.0000656 time=119.02 INFO:root:[step 343999] mlm_loss=1.62974 mlm_acc=65.12366 nsp_loss=0.04207 nsp_acc=98.494 throughput=120.0K tks/s lr=0.0000656 time=122.45 INFO:root:[step 344249] mlm_loss=1.60062 mlm_acc=65.73397 nsp_loss=0.04242 nsp_acc=98.419 throughput=127.0K tks/s lr=0.0000656 time=110.87 INFO:root:[step 344499] mlm_loss=1.69013 mlm_acc=64.98328 nsp_loss=0.04358 nsp_acc=98.423 throughput=125.0K tks/s lr=0.0000656 time=125.91 INFO:root:[step 344749] mlm_loss=1.77278 mlm_acc=62.34095 nsp_loss=0.05925 nsp_acc=97.699 throughput=149.0K tks/s lr=0.0000655 time=143.28 INFO:root:[step 344999] mlm_loss=1.91246 mlm_acc=60.79878 nsp_loss=0.09775 nsp_acc=96.082 throughput=162.0K tks/s lr=0.0000655 time=170.01 INFO:root:[step 344999] Saving checkpoints to /home/ubuntu/ckpt-master/0344999.params, /home/ubuntu/ckpt-master/0344999.states. INFO:root:[step 345249] mlm_loss=2.06083 mlm_acc=59.73495 nsp_loss=0.10392 nsp_acc=95.904 throughput=127.0K tks/s lr=0.0000655 time=161.12 INFO:root:[step 345499] mlm_loss=1.68553 mlm_acc=64.61679 nsp_loss=0.04455 nsp_acc=98.366 throughput=129.0K tks/s lr=0.0000655 time=130.17 INFO:root:[step 345749] mlm_loss=1.83134 mlm_acc=61.35722 nsp_loss=0.04599 nsp_acc=98.298 throughput=147.0K tks/s lr=0.0000654 time=143.22 INFO:root:[step 345999] mlm_loss=1.63276 mlm_acc=65.34100 nsp_loss=0.04559 nsp_acc=98.349 throughput=127.0K tks/s lr=0.0000654 time=123.92 INFO:root:[step 346249] mlm_loss=1.73307 mlm_acc=64.75811 nsp_loss=0.04073 nsp_acc=98.437 throughput=138.0K tks/s lr=0.0000654 time=137.86 INFO:root:[step 346499] mlm_loss=1.65909 mlm_acc=64.86942 nsp_loss=0.03929 nsp_acc=98.583 throughput=139.0K tks/s lr=0.0000654 time=117.47 INFO:root:[step 346749] mlm_loss=1.56133 mlm_acc=65.98358 nsp_loss=0.04478 nsp_acc=98.363 throughput=120.0K tks/s lr=0.0000653 time=120.68 INFO:root:[step 346999] mlm_loss=1.70699 mlm_acc=64.73136 nsp_loss=0.03845 nsp_acc=98.560 throughput=139.0K tks/s lr=0.0000653 time=141.85 INFO:root:[step 347249] mlm_loss=1.64126 mlm_acc=64.87214 nsp_loss=0.04152 nsp_acc=98.465 throughput=140.0K tks/s lr=0.0000653 time=117.85 INFO:root:[step 347499] mlm_loss=1.63533 mlm_acc=65.39149 nsp_loss=0.04507 nsp_acc=98.385 throughput=123.0K tks/s lr=0.0000653 time=123.47 INFO:root:[step 347749] mlm_loss=1.86128 mlm_acc=61.71579 nsp_loss=0.08703 nsp_acc=96.412 throughput=154.0K tks/s lr=0.0000652 time=151.53 INFO:root:[step 347999] mlm_loss=1.55970 mlm_acc=68.09412 nsp_loss=0.05985 nsp_acc=97.776 throughput=141.0K tks/s lr=0.0000652 time=139.13 INFO:root:[step 348249] mlm_loss=1.71108 mlm_acc=65.46967 nsp_loss=0.07997 nsp_acc=96.845 throughput=135.0K tks/s lr=0.0000652 time=139.05 INFO:root:[step 348499] mlm_loss=1.61317 mlm_acc=65.60320 nsp_loss=0.04140 nsp_acc=98.535 throughput=128.0K tks/s lr=0.0000652 time=112.69 INFO:root:[step 348749] mlm_loss=1.68458 mlm_acc=64.54732 nsp_loss=0.03798 nsp_acc=98.617 throughput=134.0K tks/s lr=0.0000651 time=132.46 INFO:root:[step 348999] mlm_loss=1.62272 mlm_acc=65.60714 nsp_loss=0.04026 nsp_acc=98.562 throughput=122.0K tks/s lr=0.0000651 time=121.85 INFO:root:[step 349249] mlm_loss=1.63125 mlm_acc=65.25262 nsp_loss=0.04196 nsp_acc=98.496 throughput=134.0K tks/s lr=0.0000651 time=117.35 INFO:root:[step 349499] mlm_loss=1.75093 mlm_acc=63.60136 nsp_loss=0.05183 nsp_acc=98.122 throughput=136.0K tks/s lr=0.0000651 time=131.54 INFO:root:[step 349749] mlm_loss=1.86893 mlm_acc=62.18165 nsp_loss=0.05032 nsp_acc=98.059 throughput=149.0K tks/s lr=0.0000650 time=148.15 INFO:root:[step 349999] mlm_loss=1.48620 mlm_acc=66.21042 nsp_loss=0.04507 nsp_acc=98.380 throughput=113.0K tks/s lr=0.0000650 time=121.51 INFO:root:[step 349999] Saving checkpoints to /home/ubuntu/ckpt-master/0349999.params, /home/ubuntu/ckpt-master/0349999.states. INFO:root:[step 350249] mlm_loss=1.67702 mlm_acc=63.60363 nsp_loss=0.06367 nsp_acc=97.584 throughput=126.0K tks/s lr=0.0000650 time=135.11 INFO:root:[step 350499] mlm_loss=1.77788 mlm_acc=62.32533 nsp_loss=0.07399 nsp_acc=97.074 throughput=146.0K tks/s lr=0.0000650 time=144.99 INFO:root:[step 350749] mlm_loss=1.52717 mlm_acc=66.02805 nsp_loss=0.05225 nsp_acc=98.049 throughput=116.0K tks/s lr=0.0000649 time=106.79 INFO:root:[step 350999] mlm_loss=1.67593 mlm_acc=64.50100 nsp_loss=0.04480 nsp_acc=98.313 throughput=126.0K tks/s lr=0.0000649 time=129.92 INFO:root:[step 351249] mlm_loss=1.68304 mlm_acc=64.67723 nsp_loss=0.04201 nsp_acc=98.469 throughput=126.0K tks/s lr=0.0000649 time=123.01 INFO:root:[step 351499] mlm_loss=1.64624 mlm_acc=64.77651 nsp_loss=0.04502 nsp_acc=98.329 throughput=135.0K tks/s lr=0.0000649 time=122.32 INFO:root:[step 351749] mlm_loss=1.55256 mlm_acc=65.91255 nsp_loss=0.04942 nsp_acc=98.215 throughput=109.0K tks/s lr=0.0000648 time=115.97 INFO:root:[step 351999] mlm_loss=1.59498 mlm_acc=65.35414 nsp_loss=0.04300 nsp_acc=98.441 throughput=132.0K tks/s lr=0.0000648 time=112.53 INFO:root:[step 352249] mlm_loss=1.86766 mlm_acc=61.89742 nsp_loss=0.05460 nsp_acc=97.899 throughput=151.0K tks/s lr=0.0000648 time=150.24 INFO:root:[step 352499] mlm_loss=1.79678 mlm_acc=63.77347 nsp_loss=0.03591 nsp_acc=98.713 throughput=142.0K tks/s lr=0.0000648 time=138.49 INFO:root:[step 352749] mlm_loss=1.78316 mlm_acc=62.36829 nsp_loss=0.13129 nsp_acc=94.332 throughput=148.0K tks/s lr=0.0000647 time=161.59 INFO:root:[step 352999] mlm_loss=1.79879 mlm_acc=63.54668 nsp_loss=0.03687 nsp_acc=98.646 throughput=142.0K tks/s lr=0.0000647 time=140.07 INFO:root:[step 353249] mlm_loss=1.64022 mlm_acc=65.25954 nsp_loss=0.04116 nsp_acc=98.506 throughput=131.0K tks/s lr=0.0000647 time=113.28 INFO:root:[step 353499] mlm_loss=1.74414 mlm_acc=62.97335 nsp_loss=0.11419 nsp_acc=95.270 throughput=155.0K tks/s lr=0.0000647 time=154.62 INFO:root:[step 353749] mlm_loss=1.57428 mlm_acc=64.80345 nsp_loss=0.06481 nsp_acc=97.558 throughput=127.0K tks/s lr=0.0000646 time=125.93 INFO:root:[step 353999] mlm_loss=1.61454 mlm_acc=64.32340 nsp_loss=0.05469 nsp_acc=97.967 throughput=132.0K tks/s lr=0.0000646 time=115.39 INFO:root:[step 354249] mlm_loss=1.77191 mlm_acc=62.39106 nsp_loss=0.10015 nsp_acc=95.825 throughput=159.0K tks/s lr=0.0000646 time=176.99 INFO:root:[step 354499] mlm_loss=1.78783 mlm_acc=62.39289 nsp_loss=0.12182 nsp_acc=94.942 throughput=144.0K tks/s lr=0.0000646 time=143.07 INFO:root:[step 354749] mlm_loss=1.81589 mlm_acc=62.53920 nsp_loss=0.07243 nsp_acc=97.164 throughput=149.0K tks/s lr=0.0000645 time=147.75 INFO:root:[step 354999] mlm_loss=1.70670 mlm_acc=64.67566 nsp_loss=0.04347 nsp_acc=98.400 throughput=128.0K tks/s lr=0.0000645 time=129.21 INFO:root:[step 354999] Saving checkpoints to /home/ubuntu/ckpt-master/0354999.params, /home/ubuntu/ckpt-master/0354999.states. INFO:root:[step 355249] mlm_loss=1.47171 mlm_acc=66.46326 nsp_loss=0.05344 nsp_acc=98.035 throughput=100.0K tks/s lr=0.0000645 time=120.32 INFO:root:[step 355499] mlm_loss=1.60697 mlm_acc=65.21460 nsp_loss=0.04981 nsp_acc=98.123 throughput=126.0K tks/s lr=0.0000645 time=109.85 INFO:root:[step 355749] mlm_loss=1.58175 mlm_acc=65.35705 nsp_loss=0.04495 nsp_acc=98.431 throughput=120.0K tks/s lr=0.0000644 time=120.94 INFO:root:[step 355999] mlm_loss=1.85768 mlm_acc=62.01127 nsp_loss=0.05969 nsp_acc=97.670 throughput=147.0K tks/s lr=0.0000644 time=145.42 INFO:root:[step 356249] mlm_loss=1.70129 mlm_acc=65.00860 nsp_loss=0.04076 nsp_acc=98.510 throughput=129.0K tks/s lr=0.0000644 time=125.63 INFO:root:[step 356499] mlm_loss=1.63752 mlm_acc=65.35123 nsp_loss=0.04051 nsp_acc=98.552 throughput=130.0K tks/s lr=0.0000644 time=116.27 INFO:root:[step 356749] mlm_loss=1.55896 mlm_acc=66.37902 nsp_loss=0.04173 nsp_acc=98.500 throughput=126.0K tks/s lr=0.0000643 time=112.37 INFO:root:[step 356999] mlm_loss=1.87476 mlm_acc=61.37046 nsp_loss=0.05001 nsp_acc=98.169 throughput=142.0K tks/s lr=0.0000643 time=157.31 INFO:root:[step 357249] mlm_loss=1.53368 mlm_acc=66.27890 nsp_loss=0.04447 nsp_acc=98.372 throughput=124.0K tks/s lr=0.0000643 time=109.35 INFO:root:[step 357499] mlm_loss=1.65956 mlm_acc=63.82063 nsp_loss=0.11700 nsp_acc=95.078 throughput=127.0K tks/s lr=0.0000643 time=128.09 INFO:root:[step 357749] mlm_loss=1.62306 mlm_acc=65.17078 nsp_loss=0.04686 nsp_acc=98.236 throughput=131.0K tks/s lr=0.0000642 time=115.22 INFO:root:[step 357999] mlm_loss=1.59863 mlm_acc=65.59166 nsp_loss=0.04600 nsp_acc=98.308 throughput=123.0K tks/s lr=0.0000642 time=111.02 INFO:root:[step 358249] mlm_loss=1.77883 mlm_acc=64.16313 nsp_loss=0.03790 nsp_acc=98.593 throughput=138.0K tks/s lr=0.0000642 time=135.01 INFO:root:[step 358499] mlm_loss=1.51437 mlm_acc=68.69011 nsp_loss=0.05367 nsp_acc=98.074 throughput=135.0K tks/s lr=0.0000642 time=135.61 INFO:root:[step 358749] mlm_loss=1.91338 mlm_acc=60.80037 nsp_loss=0.09455 nsp_acc=96.196 throughput=130.0K tks/s lr=0.0000641 time=129.90 INFO:root:[step 358999] mlm_loss=1.55598 mlm_acc=66.13842 nsp_loss=0.04442 nsp_acc=98.323 throughput=127.0K tks/s lr=0.0000641 time=112.44 INFO:root:[step 359249] mlm_loss=1.67277 mlm_acc=64.16085 nsp_loss=0.07839 nsp_acc=96.885 throughput=146.0K tks/s lr=0.0000641 time=142.51 INFO:root:[step 359499] mlm_loss=1.83385 mlm_acc=62.61438 nsp_loss=0.05374 nsp_acc=97.923 throughput=143.0K tks/s lr=0.0000641 time=135.98 INFO:root:[step 359749] mlm_loss=1.65569 mlm_acc=63.80957 nsp_loss=0.04693 nsp_acc=98.239 throughput=128.0K tks/s lr=0.0000640 time=125.20 INFO:root:[step 359999] mlm_loss=1.82382 mlm_acc=62.61703 nsp_loss=0.06681 nsp_acc=97.360 throughput=156.0K tks/s lr=0.0000640 time=154.20 INFO:root:[step 359999] Saving checkpoints to /home/ubuntu/ckpt-master/0359999.params, /home/ubuntu/ckpt-master/0359999.states. INFO:root:[step 360249] mlm_loss=1.60674 mlm_acc=65.33926 nsp_loss=0.04179 nsp_acc=98.469 throughput=111.0K tks/s lr=0.0000640 time=136.50 INFO:root:[step 360499] mlm_loss=1.80084 mlm_acc=63.87121 nsp_loss=0.03696 nsp_acc=98.627 throughput=141.0K tks/s lr=0.0000640 time=140.31 INFO:root:[step 360749] mlm_loss=1.76406 mlm_acc=62.77041 nsp_loss=0.04957 nsp_acc=98.096 throughput=143.0K tks/s lr=0.0000639 time=144.47 INFO:root:[step 360999] mlm_loss=1.65171 mlm_acc=62.04652 nsp_loss=0.06482 nsp_acc=97.633 throughput=136.0K tks/s lr=0.0000639 time=133.74 INFO:root:[step 361249] mlm_loss=1.81176 mlm_acc=62.17237 nsp_loss=0.04603 nsp_acc=98.286 throughput=147.0K tks/s lr=0.0000639 time=151.74 INFO:root:[step 361499] mlm_loss=1.52643 mlm_acc=66.49463 nsp_loss=0.04340 nsp_acc=98.453 throughput=119.0K tks/s lr=0.0000639 time=108.01 INFO:root:[step 361749] mlm_loss=1.64098 mlm_acc=63.77452 nsp_loss=0.05341 nsp_acc=98.019 throughput=138.0K tks/s lr=0.0000638 time=135.08 INFO:root:[step 361999] mlm_loss=1.66641 mlm_acc=63.77655 nsp_loss=0.06956 nsp_acc=97.247 throughput=140.0K tks/s lr=0.0000638 time=136.57 INFO:root:[step 362249] mlm_loss=1.67980 mlm_acc=64.91317 nsp_loss=0.04258 nsp_acc=98.453 throughput=134.0K tks/s lr=0.0000638 time=119.44 INFO:root:[step 362499] mlm_loss=1.40755 mlm_acc=66.77770 nsp_loss=0.05245 nsp_acc=98.069 throughput=112.0K tks/s lr=0.0000638 time=112.93 INFO:root:[step 362749] mlm_loss=1.59285 mlm_acc=64.02078 nsp_loss=0.07268 nsp_acc=97.203 throughput=143.0K tks/s lr=0.0000637 time=132.90 INFO:root:[step 362999] mlm_loss=1.76019 mlm_acc=62.08473 nsp_loss=0.05690 nsp_acc=97.804 throughput=140.0K tks/s lr=0.0000637 time=138.68 INFO:root:[step 363249] mlm_loss=1.78327 mlm_acc=63.46301 nsp_loss=0.06106 nsp_acc=97.547 throughput=149.0K tks/s lr=0.0000637 time=142.74 INFO:root:[step 363499] mlm_loss=1.74348 mlm_acc=64.27467 nsp_loss=0.04554 nsp_acc=98.252 throughput=136.0K tks/s lr=0.0000637 time=132.68 INFO:root:[step 363749] mlm_loss=1.52386 mlm_acc=66.58376 nsp_loss=0.04309 nsp_acc=98.480 throughput=116.0K tks/s lr=0.0000636 time=119.13 INFO:root:[step 363999] mlm_loss=1.53703 mlm_acc=66.30583 nsp_loss=0.05229 nsp_acc=98.078 throughput=123.0K tks/s lr=0.0000636 time=112.62 INFO:root:[step 364249] mlm_loss=1.59768 mlm_acc=66.02812 nsp_loss=0.04504 nsp_acc=98.299 throughput=124.0K tks/s lr=0.0000636 time=111.56 INFO:root:[step 364499] mlm_loss=1.70725 mlm_acc=64.99974 nsp_loss=0.03950 nsp_acc=98.565 throughput=136.0K tks/s lr=0.0000636 time=131.80 INFO:root:[step 364749] mlm_loss=1.66861 mlm_acc=64.76770 nsp_loss=0.05617 nsp_acc=97.865 throughput=133.0K tks/s lr=0.0000635 time=132.67 INFO:root:[step 364999] mlm_loss=1.65922 mlm_acc=64.45736 nsp_loss=0.08371 nsp_acc=96.529 throughput=133.0K tks/s lr=0.0000635 time=133.23 INFO:root:[step 364999] Saving checkpoints to /home/ubuntu/ckpt-master/0364999.params, /home/ubuntu/ckpt-master/0364999.states. INFO:root:[step 365249] mlm_loss=1.68267 mlm_acc=64.10287 nsp_loss=0.11026 nsp_acc=95.145 throughput=120.0K tks/s lr=0.0000635 time=140.09 INFO:root:[step 365499] mlm_loss=1.55048 mlm_acc=66.14832 nsp_loss=0.04417 nsp_acc=98.398 throughput=124.0K tks/s lr=0.0000635 time=109.00 INFO:root:[step 365749] mlm_loss=1.72725 mlm_acc=62.63163 nsp_loss=0.05353 nsp_acc=98.029 throughput=137.0K tks/s lr=0.0000634 time=134.76 INFO:root:[step 365999] mlm_loss=1.86547 mlm_acc=62.04689 nsp_loss=0.06178 nsp_acc=97.581 throughput=144.0K tks/s lr=0.0000634 time=157.66 INFO:root:[step 366249] mlm_loss=1.54020 mlm_acc=65.95089 nsp_loss=0.04469 nsp_acc=98.409 throughput=124.0K tks/s lr=0.0000634 time=109.51 INFO:root:[step 366499] mlm_loss=1.65238 mlm_acc=65.32067 nsp_loss=0.04245 nsp_acc=98.499 throughput=125.0K tks/s lr=0.0000634 time=127.16 INFO:root:[step 366749] mlm_loss=1.35883 mlm_acc=67.69084 nsp_loss=0.05632 nsp_acc=97.963 throughput=115.0K tks/s lr=0.0000633 time=105.37 INFO:root:[step 366999] mlm_loss=1.59216 mlm_acc=66.13854 nsp_loss=0.04246 nsp_acc=98.477 throughput=128.0K tks/s lr=0.0000633 time=111.24 INFO:root:[step 367249] mlm_loss=1.70377 mlm_acc=64.19144 nsp_loss=0.08500 nsp_acc=96.504 throughput=137.0K tks/s lr=0.0000633 time=139.10 INFO:root:[step 367499] mlm_loss=1.69299 mlm_acc=64.68214 nsp_loss=0.04316 nsp_acc=98.423 throughput=132.0K tks/s lr=0.0000633 time=129.27 INFO:root:[step 367749] mlm_loss=1.45930 mlm_acc=67.05179 nsp_loss=0.04864 nsp_acc=98.307 throughput=122.0K tks/s lr=0.0000632 time=108.34 INFO:root:[step 367999] mlm_loss=1.72402 mlm_acc=63.61944 nsp_loss=0.04055 nsp_acc=98.480 throughput=139.0K tks/s lr=0.0000632 time=133.22 INFO:root:[step 368249] mlm_loss=1.77203 mlm_acc=64.22972 nsp_loss=0.04046 nsp_acc=98.550 throughput=138.0K tks/s lr=0.0000632 time=134.52 INFO:root:[step 368499] mlm_loss=1.60415 mlm_acc=65.58147 nsp_loss=0.04222 nsp_acc=98.460 throughput=130.0K tks/s lr=0.0000632 time=114.27 INFO:root:[step 368749] mlm_loss=1.67624 mlm_acc=64.65247 nsp_loss=0.04096 nsp_acc=98.504 throughput=129.0K tks/s lr=0.0000631 time=128.95 INFO:root:[step 368999] mlm_loss=1.52626 mlm_acc=66.71789 nsp_loss=0.04494 nsp_acc=98.373 throughput=119.0K tks/s lr=0.0000631 time=104.68 INFO:root:[step 369249] mlm_loss=1.92811 mlm_acc=61.01570 nsp_loss=0.08104 nsp_acc=96.818 throughput=130.0K tks/s lr=0.0000631 time=130.67 INFO:root:[step 369499] mlm_loss=1.52262 mlm_acc=66.31401 nsp_loss=0.04576 nsp_acc=98.372 throughput=121.0K tks/s lr=0.0000631 time=111.42 INFO:root:[step 369749] mlm_loss=1.75974 mlm_acc=64.26068 nsp_loss=0.03600 nsp_acc=98.721 throughput=141.0K tks/s lr=0.0000630 time=137.29 INFO:root:[step 369999] mlm_loss=1.60686 mlm_acc=65.30731 nsp_loss=0.04692 nsp_acc=98.251 throughput=121.0K tks/s lr=0.0000630 time=120.55 INFO:root:[step 369999] Saving checkpoints to /home/ubuntu/ckpt-master/0369999.params, /home/ubuntu/ckpt-master/0369999.states. INFO:root:[step 370249] mlm_loss=1.81912 mlm_acc=62.63108 nsp_loss=0.05789 nsp_acc=97.768 throughput=143.0K tks/s lr=0.0000630 time=172.90 INFO:root:[step 370499] mlm_loss=1.66723 mlm_acc=64.87650 nsp_loss=0.04124 nsp_acc=98.487 throughput=131.0K tks/s lr=0.0000630 time=129.93 INFO:root:[step 370749] mlm_loss=1.75496 mlm_acc=62.22457 nsp_loss=0.08522 nsp_acc=96.627 throughput=150.0K tks/s lr=0.0000629 time=150.07 INFO:root:[step 370999] mlm_loss=1.66812 mlm_acc=63.84253 nsp_loss=0.06183 nsp_acc=97.584 throughput=123.0K tks/s lr=0.0000629 time=120.34 INFO:root:[step 371249] mlm_loss=1.85035 mlm_acc=62.06576 nsp_loss=0.09036 nsp_acc=96.375 throughput=150.0K tks/s lr=0.0000629 time=149.88 INFO:root:[step 371499] mlm_loss=1.69051 mlm_acc=65.18537 nsp_loss=0.04098 nsp_acc=98.451 throughput=129.0K tks/s lr=0.0000629 time=126.48 INFO:root:[step 371749] mlm_loss=1.65356 mlm_acc=64.78275 nsp_loss=0.07854 nsp_acc=96.909 throughput=138.0K tks/s lr=0.0000628 time=119.81 INFO:root:[step 371999] mlm_loss=1.64893 mlm_acc=64.70983 nsp_loss=0.05783 nsp_acc=97.788 throughput=132.0K tks/s lr=0.0000628 time=132.78 INFO:root:[step 372249] mlm_loss=1.64166 mlm_acc=64.17836 nsp_loss=0.10217 nsp_acc=95.887 throughput=129.0K tks/s lr=0.0000628 time=132.27 INFO:root:[step 372499] mlm_loss=1.64939 mlm_acc=62.96926 nsp_loss=0.05267 nsp_acc=98.060 throughput=139.0K tks/s lr=0.0000628 time=120.01 INFO:root:[step 372749] mlm_loss=1.54296 mlm_acc=65.05917 nsp_loss=0.05908 nsp_acc=97.791 throughput=116.0K tks/s lr=0.0000627 time=118.69 INFO:root:[step 372999] mlm_loss=1.55889 mlm_acc=65.28490 nsp_loss=0.08269 nsp_acc=96.794 throughput=137.0K tks/s lr=0.0000627 time=126.67 INFO:root:[step 373249] mlm_loss=1.71180 mlm_acc=63.40213 nsp_loss=0.07057 nsp_acc=97.300 throughput=147.0K tks/s lr=0.0000627 time=160.35 INFO:root:[step 373499] mlm_loss=1.69034 mlm_acc=65.05723 nsp_loss=0.04063 nsp_acc=98.532 throughput=138.0K tks/s lr=0.0000627 time=118.54 INFO:root:[step 373749] mlm_loss=1.55391 mlm_acc=66.21058 nsp_loss=0.04353 nsp_acc=98.441 throughput=114.0K tks/s lr=0.0000626 time=118.75 INFO:root:[step 373999] mlm_loss=1.72530 mlm_acc=64.50596 nsp_loss=0.03680 nsp_acc=98.675 throughput=145.0K tks/s lr=0.0000626 time=126.91 INFO:root:[step 374249] mlm_loss=1.61532 mlm_acc=64.01704 nsp_loss=0.05452 nsp_acc=97.929 throughput=130.0K tks/s lr=0.0000626 time=129.95 INFO:root:[step 374499] mlm_loss=1.59231 mlm_acc=64.73009 nsp_loss=0.05559 nsp_acc=97.962 throughput=120.0K tks/s lr=0.0000626 time=124.62 INFO:root:[step 374749] mlm_loss=1.55081 mlm_acc=65.99332 nsp_loss=0.04140 nsp_acc=98.499 throughput=125.0K tks/s lr=0.0000625 time=112.60 INFO:root:[step 374999] mlm_loss=1.51722 mlm_acc=66.60600 nsp_loss=0.04237 nsp_acc=98.419 throughput=121.0K tks/s lr=0.0000625 time=109.63 INFO:root:[step 374999] Saving checkpoints to /home/ubuntu/ckpt-master/0374999.params, /home/ubuntu/ckpt-master/0374999.states. INFO:root:[step 375249] mlm_loss=1.71949 mlm_acc=64.52699 nsp_loss=0.03892 nsp_acc=98.590 throughput=121.0K tks/s lr=0.0000625 time=149.24 INFO:root:[step 375499] mlm_loss=1.71697 mlm_acc=64.57229 nsp_loss=0.03928 nsp_acc=98.521 throughput=130.0K tks/s lr=0.0000625 time=128.93 INFO:root:[step 375749] mlm_loss=1.58196 mlm_acc=65.75967 nsp_loss=0.04534 nsp_acc=98.390 throughput=126.0K tks/s lr=0.0000624 time=112.79 INFO:root:[step 375999] mlm_loss=1.64538 mlm_acc=65.11467 nsp_loss=0.04567 nsp_acc=98.346 throughput=127.0K tks/s lr=0.0000624 time=126.97 INFO:root:[step 376249] mlm_loss=1.65306 mlm_acc=64.80444 nsp_loss=0.04494 nsp_acc=98.384 throughput=139.0K tks/s lr=0.0000624 time=117.45 INFO:root:[step 376499] mlm_loss=1.52640 mlm_acc=66.57486 nsp_loss=0.04281 nsp_acc=98.439 throughput=114.0K tks/s lr=0.0000624 time=118.87 INFO:root:[step 376749] mlm_loss=1.55191 mlm_acc=66.38879 nsp_loss=0.04252 nsp_acc=98.440 throughput=123.0K tks/s lr=0.0000623 time=110.07 INFO:root:[step 376999] mlm_loss=1.51671 mlm_acc=66.88758 nsp_loss=0.04292 nsp_acc=98.463 throughput=120.0K tks/s lr=0.0000623 time=107.60 INFO:root:[step 377249] mlm_loss=1.77439 mlm_acc=63.12547 nsp_loss=0.09103 nsp_acc=96.186 throughput=141.0K tks/s lr=0.0000623 time=157.40 INFO:root:[step 377499] mlm_loss=1.69848 mlm_acc=63.39274 nsp_loss=0.06395 nsp_acc=97.519 throughput=143.0K tks/s lr=0.0000623 time=139.09 INFO:root:[step 377749] mlm_loss=1.69579 mlm_acc=65.01230 nsp_loss=0.04302 nsp_acc=98.434 throughput=141.0K tks/s lr=0.0000622 time=123.62 INFO:root:[step 377999] mlm_loss=1.63848 mlm_acc=65.26488 nsp_loss=0.04295 nsp_acc=98.415 throughput=125.0K tks/s lr=0.0000622 time=122.61 INFO:root:[step 378249] mlm_loss=1.77621 mlm_acc=63.44247 nsp_loss=0.07439 nsp_acc=96.969 throughput=151.0K tks/s lr=0.0000622 time=150.15 INFO:root:[step 378499] mlm_loss=1.54743 mlm_acc=66.08062 nsp_loss=0.04297 nsp_acc=98.453 throughput=118.0K tks/s lr=0.0000622 time=122.73 INFO:root:[step 378749] mlm_loss=1.55914 mlm_acc=66.11025 nsp_loss=0.04217 nsp_acc=98.483 throughput=128.0K tks/s lr=0.0000621 time=109.32 INFO:root:[step 378999] mlm_loss=1.72078 mlm_acc=64.90302 nsp_loss=0.03976 nsp_acc=98.542 throughput=131.0K tks/s lr=0.0000621 time=131.48 INFO:root:[step 379249] mlm_loss=1.75247 mlm_acc=62.31029 nsp_loss=0.06064 nsp_acc=97.739 throughput=144.0K tks/s lr=0.0000621 time=141.91 INFO:root:[step 379499] mlm_loss=1.77062 mlm_acc=63.89532 nsp_loss=0.03765 nsp_acc=98.609 throughput=139.0K tks/s lr=0.0000621 time=141.23 INFO:root:[step 379749] mlm_loss=1.50542 mlm_acc=66.81285 nsp_loss=0.04639 nsp_acc=98.331 throughput=113.0K tks/s lr=0.0000620 time=106.91 INFO:root:[step 379999] mlm_loss=1.58521 mlm_acc=65.88292 nsp_loss=0.04439 nsp_acc=98.418 throughput=126.0K tks/s lr=0.0000620 time=111.77 INFO:root:[step 379999] Saving checkpoints to /home/ubuntu/ckpt-master/0379999.params, /home/ubuntu/ckpt-master/0379999.states. INFO:root:[step 380249] mlm_loss=1.59079 mlm_acc=65.00119 nsp_loss=0.05522 nsp_acc=97.987 throughput=119.0K tks/s lr=0.0000620 time=146.73 INFO:root:[step 380499] mlm_loss=1.62395 mlm_acc=65.34465 nsp_loss=0.04469 nsp_acc=98.364 throughput=127.0K tks/s lr=0.0000620 time=129.63 INFO:root:[step 380749] mlm_loss=1.64144 mlm_acc=65.38254 nsp_loss=0.04259 nsp_acc=98.499 throughput=131.0K tks/s lr=0.0000619 time=115.54 INFO:root:[step 380999] mlm_loss=1.77844 mlm_acc=63.94486 nsp_loss=0.03657 nsp_acc=98.667 throughput=143.0K tks/s lr=0.0000619 time=139.66 INFO:root:[step 381249] mlm_loss=1.78977 mlm_acc=62.92908 nsp_loss=0.05431 nsp_acc=97.985 throughput=141.0K tks/s lr=0.0000619 time=140.13 INFO:root:[step 381499] mlm_loss=1.68672 mlm_acc=63.99558 nsp_loss=0.08165 nsp_acc=96.793 throughput=145.0K tks/s lr=0.0000619 time=144.86 INFO:root:[step 381749] mlm_loss=1.80470 mlm_acc=63.58831 nsp_loss=0.03623 nsp_acc=98.771 throughput=147.0K tks/s lr=0.0000618 time=142.65 INFO:root:[step 381999] mlm_loss=1.94478 mlm_acc=59.59852 nsp_loss=0.08654 nsp_acc=96.611 throughput=143.0K tks/s lr=0.0000618 time=163.38 INFO:root:[step 382249] mlm_loss=1.57004 mlm_acc=64.98112 nsp_loss=0.08462 nsp_acc=96.581 throughput=136.0K tks/s lr=0.0000618 time=138.12 INFO:root:[step 382499] mlm_loss=1.52679 mlm_acc=65.88486 nsp_loss=0.04745 nsp_acc=98.312 throughput=125.0K tks/s lr=0.0000618 time=112.86 INFO:root:[step 382749] mlm_loss=1.81479 mlm_acc=62.24358 nsp_loss=0.08901 nsp_acc=96.485 throughput=150.0K tks/s lr=0.0000617 time=150.37 INFO:root:[step 382999] mlm_loss=1.84092 mlm_acc=62.78198 nsp_loss=0.03819 nsp_acc=98.596 throughput=151.0K tks/s lr=0.0000617 time=149.28 INFO:root:[step 383249] mlm_loss=1.46148 mlm_acc=66.60861 nsp_loss=0.04214 nsp_acc=98.465 throughput=111.0K tks/s lr=0.0000617 time=115.99 INFO:root:[step 383499] mlm_loss=1.58650 mlm_acc=66.13064 nsp_loss=0.03270 nsp_acc=98.860 throughput=128.0K tks/s lr=0.0000617 time=115.26 INFO:root:[step 383749] mlm_loss=1.78286 mlm_acc=62.01978 nsp_loss=0.09767 nsp_acc=96.007 throughput=150.0K tks/s lr=0.0000616 time=152.08 INFO:root:[step 383999] mlm_loss=1.69798 mlm_acc=64.52577 nsp_loss=0.07439 nsp_acc=97.084 throughput=152.0K tks/s lr=0.0000616 time=167.46 INFO:root:[step 384249] mlm_loss=1.56807 mlm_acc=64.68518 nsp_loss=0.05117 nsp_acc=98.084 throughput=134.0K tks/s lr=0.0000616 time=124.14 INFO:root:[step 384499] mlm_loss=1.79314 mlm_acc=63.48272 nsp_loss=0.03125 nsp_acc=98.899 throughput=144.0K tks/s lr=0.0000616 time=151.41 INFO:root:[step 384749] mlm_loss=1.76324 mlm_acc=63.42127 nsp_loss=0.05385 nsp_acc=97.894 throughput=150.0K tks/s lr=0.0000615 time=150.84 INFO:root:[step 384999] mlm_loss=1.50959 mlm_acc=66.33639 nsp_loss=0.03691 nsp_acc=98.651 throughput=128.0K tks/s lr=0.0000615 time=109.99 INFO:root:[step 384999] Saving checkpoints to /home/ubuntu/ckpt-master/0384999.params, /home/ubuntu/ckpt-master/0384999.states. INFO:root:[step 385249] mlm_loss=1.56829 mlm_acc=66.14859 nsp_loss=0.03484 nsp_acc=98.781 throughput=107.0K tks/s lr=0.0000615 time=138.33 INFO:root:[step 385499] mlm_loss=1.49706 mlm_acc=66.84322 nsp_loss=0.03312 nsp_acc=98.832 throughput=127.0K tks/s lr=0.0000615 time=109.34 INFO:root:[step 385749] mlm_loss=1.63735 mlm_acc=65.14036 nsp_loss=0.03159 nsp_acc=98.868 throughput=132.0K tks/s lr=0.0000614 time=130.50 INFO:root:[step 385999] mlm_loss=1.56313 mlm_acc=65.97634 nsp_loss=0.03939 nsp_acc=98.622 throughput=127.0K tks/s lr=0.0000614 time=111.83 INFO:root:[step 386249] mlm_loss=1.81575 mlm_acc=62.22725 nsp_loss=0.08882 nsp_acc=96.370 throughput=152.0K tks/s lr=0.0000614 time=167.44 INFO:root:[step 386499] mlm_loss=1.76258 mlm_acc=63.23391 nsp_loss=0.05718 nsp_acc=97.682 throughput=154.0K tks/s lr=0.0000614 time=150.72 INFO:root:[step 386749] mlm_loss=1.72204 mlm_acc=63.57450 nsp_loss=0.08282 nsp_acc=96.651 throughput=140.0K tks/s lr=0.0000613 time=141.14 INFO:root:[step 386999] mlm_loss=1.56275 mlm_acc=66.10332 nsp_loss=0.04214 nsp_acc=98.508 throughput=127.0K tks/s lr=0.0000613 time=113.19 INFO:root:[step 387249] mlm_loss=1.65270 mlm_acc=65.42705 nsp_loss=0.03048 nsp_acc=98.934 throughput=132.0K tks/s lr=0.0000613 time=130.62 INFO:root:[step 387499] mlm_loss=1.73135 mlm_acc=63.62882 nsp_loss=0.06227 nsp_acc=97.480 throughput=143.0K tks/s lr=0.0000613 time=139.35 INFO:root:[step 387749] mlm_loss=1.58360 mlm_acc=65.02679 nsp_loss=0.05393 nsp_acc=97.988 throughput=123.0K tks/s lr=0.0000612 time=125.98 INFO:root:[step 387999] mlm_loss=1.42888 mlm_acc=67.45140 nsp_loss=0.03587 nsp_acc=98.770 throughput=118.0K tks/s lr=0.0000612 time=105.72 INFO:root:[step 388249] mlm_loss=1.63016 mlm_acc=64.23128 nsp_loss=0.06443 nsp_acc=97.480 throughput=142.0K tks/s lr=0.0000612 time=139.74 INFO:root:[step 388499] mlm_loss=1.66534 mlm_acc=64.99489 nsp_loss=0.03526 nsp_acc=98.679 throughput=128.0K tks/s lr=0.0000612 time=130.93 INFO:root:[step 388749] mlm_loss=1.26482 mlm_acc=68.78642 nsp_loss=0.04882 nsp_acc=98.261 throughput=103.0K tks/s lr=0.0000611 time=100.29 INFO:root:[step 388999] mlm_loss=1.69820 mlm_acc=63.46925 nsp_loss=0.05705 nsp_acc=97.822 throughput=130.0K tks/s lr=0.0000611 time=114.93 INFO:root:[step 389249] mlm_loss=1.72676 mlm_acc=63.70996 nsp_loss=0.04717 nsp_acc=98.259 throughput=126.0K tks/s lr=0.0000611 time=124.93 INFO:root:[step 389499] mlm_loss=1.61521 mlm_acc=65.57909 nsp_loss=0.03819 nsp_acc=98.591 throughput=132.0K tks/s lr=0.0000611 time=116.97 INFO:root:[step 389749] mlm_loss=1.49792 mlm_acc=66.62987 nsp_loss=0.03416 nsp_acc=98.759 throughput=117.0K tks/s lr=0.0000610 time=116.87 INFO:root:[step 389999] mlm_loss=1.60094 mlm_acc=63.91497 nsp_loss=0.05248 nsp_acc=98.022 throughput=141.0K tks/s lr=0.0000610 time=130.18 INFO:root:[step 389999] Saving checkpoints to /home/ubuntu/ckpt-master/0389999.params, /home/ubuntu/ckpt-master/0389999.states. INFO:root:[step 390249] mlm_loss=1.63598 mlm_acc=64.02734 nsp_loss=0.09007 nsp_acc=96.389 throughput=122.0K tks/s lr=0.0000610 time=149.92 INFO:root:[step 390499] mlm_loss=1.74177 mlm_acc=63.08463 nsp_loss=0.05922 nsp_acc=97.694 throughput=143.0K tks/s lr=0.0000610 time=139.08 INFO:root:[step 390749] mlm_loss=1.54231 mlm_acc=66.47069 nsp_loss=0.03754 nsp_acc=98.625 throughput=123.0K tks/s lr=0.0000609 time=109.82 INFO:root:[step 390999] mlm_loss=1.58279 mlm_acc=65.96306 nsp_loss=0.03837 nsp_acc=98.617 throughput=119.0K tks/s lr=0.0000609 time=123.08 INFO:root:[step 391249] mlm_loss=1.81667 mlm_acc=62.67857 nsp_loss=0.07226 nsp_acc=97.118 throughput=151.0K tks/s lr=0.0000609 time=149.50 INFO:root:[step 391499] mlm_loss=1.67355 mlm_acc=64.06959 nsp_loss=0.06233 nsp_acc=97.583 throughput=136.0K tks/s lr=0.0000609 time=137.48 INFO:root:[step 391749] mlm_loss=1.84601 mlm_acc=62.80499 nsp_loss=0.05472 nsp_acc=97.834 throughput=142.0K tks/s lr=0.0000608 time=142.50 INFO:root:[step 391999] mlm_loss=1.71122 mlm_acc=64.02379 nsp_loss=0.08493 nsp_acc=96.607 throughput=146.0K tks/s lr=0.0000608 time=145.03 INFO:root:[step 392249] mlm_loss=1.58169 mlm_acc=65.87580 nsp_loss=0.03917 nsp_acc=98.523 throughput=131.0K tks/s lr=0.0000608 time=117.37 INFO:root:[step 392499] mlm_loss=1.54851 mlm_acc=66.49778 nsp_loss=0.03965 nsp_acc=98.588 throughput=118.0K tks/s lr=0.0000608 time=123.22 INFO:root:[step 392749] mlm_loss=1.59478 mlm_acc=63.01356 nsp_loss=0.05462 nsp_acc=98.030 throughput=142.0K tks/s lr=0.0000607 time=127.21 INFO:root:[step 392999] mlm_loss=1.58545 mlm_acc=65.93106 nsp_loss=0.03670 nsp_acc=98.680 throughput=118.0K tks/s lr=0.0000607 time=120.25 INFO:root:[step 393249] mlm_loss=1.52941 mlm_acc=66.03688 nsp_loss=0.04247 nsp_acc=98.447 throughput=122.0K tks/s lr=0.0000607 time=110.56 INFO:root:[step 393499] mlm_loss=1.87822 mlm_acc=60.36510 nsp_loss=0.06935 nsp_acc=97.280 throughput=142.0K tks/s lr=0.0000607 time=164.27 INFO:root:[step 393749] mlm_loss=1.28684 mlm_acc=68.13212 nsp_loss=0.05183 nsp_acc=98.176 throughput=109.0K tks/s lr=0.0000606 time=97.22 INFO:root:[step 393999] mlm_loss=1.64642 mlm_acc=64.53832 nsp_loss=0.03657 nsp_acc=98.755 throughput=137.0K tks/s lr=0.0000606 time=123.71 INFO:root:[step 394249] mlm_loss=1.56986 mlm_acc=66.08991 nsp_loss=0.03993 nsp_acc=98.585 throughput=117.0K tks/s lr=0.0000606 time=117.08 INFO:root:[step 394499] mlm_loss=1.75316 mlm_acc=64.33941 nsp_loss=0.03416 nsp_acc=98.778 throughput=138.0K tks/s lr=0.0000606 time=136.07 INFO:root:[step 394749] mlm_loss=1.58779 mlm_acc=65.97575 nsp_loss=0.04018 nsp_acc=98.522 throughput=130.0K tks/s lr=0.0000605 time=113.66 INFO:root:[step 394999] mlm_loss=1.80614 mlm_acc=62.18279 nsp_loss=0.03969 nsp_acc=98.499 throughput=146.0K tks/s lr=0.0000605 time=160.99 INFO:root:[step 394999] Saving checkpoints to /home/ubuntu/ckpt-master/0394999.params, /home/ubuntu/ckpt-master/0394999.states. INFO:root:[step 395249] mlm_loss=1.57051 mlm_acc=65.02411 nsp_loss=0.05595 nsp_acc=97.819 throughput=120.0K tks/s lr=0.0000605 time=129.78 INFO:root:[step 395499] mlm_loss=1.67791 mlm_acc=64.33749 nsp_loss=0.04955 nsp_acc=98.102 throughput=133.0K tks/s lr=0.0000605 time=132.68 INFO:root:[step 395749] mlm_loss=1.58120 mlm_acc=66.07673 nsp_loss=0.04077 nsp_acc=98.558 throughput=129.0K tks/s lr=0.0000604 time=113.88 INFO:root:[step 395999] mlm_loss=1.31674 mlm_acc=68.20704 nsp_loss=0.05328 nsp_acc=98.087 throughput=114.0K tks/s lr=0.0000604 time=105.89 INFO:root:[step 396249] mlm_loss=1.72167 mlm_acc=63.08390 nsp_loss=0.09002 nsp_acc=96.350 throughput=158.0K tks/s lr=0.0000604 time=176.79 INFO:root:[step 396499] mlm_loss=1.60220 mlm_acc=64.72904 nsp_loss=0.05080 nsp_acc=98.118 throughput=128.0K tks/s lr=0.0000604 time=134.49 INFO:root:[step 396749] mlm_loss=1.54521 mlm_acc=65.82931 nsp_loss=0.04182 nsp_acc=98.474 throughput=127.0K tks/s lr=0.0000603 time=112.11 INFO:root:[step 396999] mlm_loss=1.73641 mlm_acc=63.90717 nsp_loss=0.06640 nsp_acc=97.340 throughput=151.0K tks/s lr=0.0000603 time=150.76 INFO:root:[step 397249] mlm_loss=1.63954 mlm_acc=65.18532 nsp_loss=0.03480 nsp_acc=98.787 throughput=125.0K tks/s lr=0.0000603 time=126.14 INFO:root:[step 397499] mlm_loss=1.71890 mlm_acc=63.13586 nsp_loss=0.05908 nsp_acc=97.673 throughput=149.0K tks/s lr=0.0000603 time=144.84 INFO:root:[step 397749] mlm_loss=1.57646 mlm_acc=65.79229 nsp_loss=0.03828 nsp_acc=98.616 throughput=122.0K tks/s lr=0.0000602 time=126.74 INFO:root:[step 397999] mlm_loss=1.54408 mlm_acc=66.10858 nsp_loss=0.04160 nsp_acc=98.511 throughput=125.0K tks/s lr=0.0000602 time=108.64 INFO:root:[step 398249] mlm_loss=1.52893 mlm_acc=66.23918 nsp_loss=0.03953 nsp_acc=98.585 throughput=122.0K tks/s lr=0.0000602 time=109.56 INFO:root:[step 398499] mlm_loss=1.63129 mlm_acc=65.52957 nsp_loss=0.03605 nsp_acc=98.719 throughput=130.0K tks/s lr=0.0000602 time=125.65 INFO:root:[step 398749] mlm_loss=1.80406 mlm_acc=62.70125 nsp_loss=0.06018 nsp_acc=97.761 throughput=154.0K tks/s lr=0.0000601 time=153.76 INFO:root:[step 398999] mlm_loss=1.52040 mlm_acc=66.14412 nsp_loss=0.04298 nsp_acc=98.463 throughput=113.0K tks/s lr=0.0000601 time=119.59 INFO:root:[step 399249] mlm_loss=1.52799 mlm_acc=66.34255 nsp_loss=0.04353 nsp_acc=98.398 throughput=123.0K tks/s lr=0.0000601 time=107.77 INFO:root:[step 399499] mlm_loss=1.47159 mlm_acc=66.44598 nsp_loss=0.05336 nsp_acc=98.022 throughput=118.0K tks/s lr=0.0000601 time=108.08 INFO:root:[step 399749] mlm_loss=1.47239 mlm_acc=66.95254 nsp_loss=0.04443 nsp_acc=98.384 throughput=118.0K tks/s lr=0.0000600 time=107.28 INFO:root:[step 399999] mlm_loss=1.76652 mlm_acc=64.35540 nsp_loss=0.03160 nsp_acc=98.857 throughput=140.0K tks/s lr=0.0000600 time=137.85 INFO:root:[step 399999] Saving checkpoints to /home/ubuntu/ckpt-master/0399999.params, /home/ubuntu/ckpt-master/0399999.states. INFO:root:[step 400249] mlm_loss=1.75015 mlm_acc=63.40164 nsp_loss=0.04459 nsp_acc=98.355 throughput=129.0K tks/s lr=0.0000600 time=170.42 INFO:root:[step 400499] mlm_loss=1.73858 mlm_acc=62.83698 nsp_loss=0.05875 nsp_acc=97.750 throughput=147.0K tks/s lr=0.0000600 time=128.60 INFO:root:[step 400749] mlm_loss=1.81781 mlm_acc=62.70367 nsp_loss=0.03684 nsp_acc=98.608 throughput=149.0K tks/s lr=0.0000599 time=164.51 INFO:root:[step 400999] mlm_loss=1.74701 mlm_acc=63.79988 nsp_loss=0.05595 nsp_acc=97.876 throughput=148.0K tks/s lr=0.0000599 time=146.19 INFO:root:[step 401249] mlm_loss=1.63364 mlm_acc=65.35955 nsp_loss=0.03950 nsp_acc=98.576 throughput=127.0K tks/s lr=0.0000599 time=123.92 INFO:root:[step 401499] mlm_loss=1.70428 mlm_acc=64.90310 nsp_loss=0.03213 nsp_acc=98.883 throughput=145.0K tks/s lr=0.0000599 time=128.64 INFO:root:[step 401749] mlm_loss=1.58234 mlm_acc=64.69332 nsp_loss=0.06373 nsp_acc=97.586 throughput=137.0K tks/s lr=0.0000598 time=136.07 INFO:root:[step 401999] mlm_loss=1.60304 mlm_acc=63.65270 nsp_loss=0.05921 nsp_acc=97.730 throughput=133.0K tks/s lr=0.0000598 time=135.06 INFO:root:[step 402249] mlm_loss=1.44328 mlm_acc=67.15584 nsp_loss=0.03831 nsp_acc=98.618 throughput=120.0K tks/s lr=0.0000598 time=106.74 INFO:root:[step 402499] mlm_loss=1.53479 mlm_acc=66.33116 nsp_loss=0.03701 nsp_acc=98.707 throughput=119.0K tks/s lr=0.0000598 time=120.69 INFO:root:[step 402749] mlm_loss=1.59745 mlm_acc=65.67634 nsp_loss=0.03814 nsp_acc=98.675 throughput=134.0K tks/s lr=0.0000597 time=115.22 INFO:root:[step 402999] mlm_loss=1.77255 mlm_acc=62.31461 nsp_loss=0.04480 nsp_acc=98.344 throughput=140.0K tks/s lr=0.0000597 time=140.21 INFO:root:[step 403249] mlm_loss=1.73255 mlm_acc=63.40515 nsp_loss=0.05086 nsp_acc=98.028 throughput=147.0K tks/s lr=0.0000597 time=144.43 INFO:root:[step 403499] mlm_loss=1.48950 mlm_acc=66.26705 nsp_loss=0.04560 nsp_acc=98.348 throughput=115.0K tks/s lr=0.0000597 time=123.10 INFO:root:[step 403749] mlm_loss=1.55560 mlm_acc=66.00863 nsp_loss=0.03917 nsp_acc=98.586 throughput=129.0K tks/s lr=0.0000596 time=115.12 INFO:root:[step 403999] mlm_loss=1.55279 mlm_acc=68.28518 nsp_loss=0.04872 nsp_acc=98.283 throughput=141.0K tks/s lr=0.0000596 time=142.52 INFO:root:[step 404249] mlm_loss=1.44929 mlm_acc=67.11064 nsp_loss=0.04581 nsp_acc=98.399 throughput=116.0K tks/s lr=0.0000596 time=116.57 INFO:root:[step 404499] mlm_loss=1.70681 mlm_acc=63.91860 nsp_loss=0.05070 nsp_acc=98.099 throughput=144.0K tks/s lr=0.0000596 time=147.93 INFO:root:[step 404749] mlm_loss=1.72327 mlm_acc=62.55700 nsp_loss=0.04877 nsp_acc=98.165 throughput=146.0K tks/s lr=0.0000595 time=125.32 INFO:root:[step 404999] mlm_loss=1.55668 mlm_acc=65.54323 nsp_loss=0.03921 nsp_acc=98.634 throughput=125.0K tks/s lr=0.0000595 time=124.17 INFO:root:[step 404999] Saving checkpoints to /home/ubuntu/ckpt-master/0404999.params, /home/ubuntu/ckpt-master/0404999.states. INFO:root:[step 405249] mlm_loss=1.81239 mlm_acc=62.32806 nsp_loss=0.08140 nsp_acc=96.689 throughput=139.0K tks/s lr=0.0000595 time=167.48 INFO:root:[step 405499] mlm_loss=1.55321 mlm_acc=65.52759 nsp_loss=0.04880 nsp_acc=98.136 throughput=123.0K tks/s lr=0.0000595 time=127.40 INFO:root:[step 405749] mlm_loss=1.56617 mlm_acc=66.16027 nsp_loss=0.04310 nsp_acc=98.420 throughput=125.0K tks/s lr=0.0000594 time=111.92 INFO:root:[step 405999] mlm_loss=1.63957 mlm_acc=65.38567 nsp_loss=0.03857 nsp_acc=98.579 throughput=124.0K tks/s lr=0.0000594 time=127.09 INFO:root:[step 406249] mlm_loss=1.42504 mlm_acc=66.85913 nsp_loss=0.05747 nsp_acc=97.800 throughput=113.0K tks/s lr=0.0000594 time=106.53 INFO:root:[step 406499] mlm_loss=1.72237 mlm_acc=62.53678 nsp_loss=0.06681 nsp_acc=97.408 throughput=138.0K tks/s lr=0.0000594 time=131.38 INFO:root:[step 406749] mlm_loss=1.65190 mlm_acc=64.63781 nsp_loss=0.03730 nsp_acc=98.668 throughput=137.0K tks/s lr=0.0000593 time=123.81 INFO:root:[step 406999] mlm_loss=1.58788 mlm_acc=65.89838 nsp_loss=0.04069 nsp_acc=98.505 throughput=116.0K tks/s lr=0.0000593 time=119.70 INFO:root:[step 407249] mlm_loss=1.66889 mlm_acc=64.93038 nsp_loss=0.03321 nsp_acc=98.836 throughput=135.0K tks/s lr=0.0000593 time=131.72 INFO:root:[step 407499] mlm_loss=1.64462 mlm_acc=63.27715 nsp_loss=0.04745 nsp_acc=98.273 throughput=145.0K tks/s lr=0.0000593 time=128.20 INFO:root:[step 407749] mlm_loss=1.39199 mlm_acc=70.37565 nsp_loss=0.05529 nsp_acc=98.096 throughput=129.0K tks/s lr=0.0000592 time=127.61 INFO:root:[step 407999] mlm_loss=1.66083 mlm_acc=65.34623 nsp_loss=0.10405 nsp_acc=95.704 throughput=150.0K tks/s lr=0.0000592 time=149.85 INFO:root:[step 408249] mlm_loss=1.67729 mlm_acc=64.78430 nsp_loss=0.06540 nsp_acc=97.302 throughput=129.0K tks/s lr=0.0000592 time=127.65 INFO:root:[step 408499] mlm_loss=1.62100 mlm_acc=65.58640 nsp_loss=0.03748 nsp_acc=98.673 throughput=131.0K tks/s lr=0.0000592 time=116.13 INFO:root:[step 408749] mlm_loss=1.91796 mlm_acc=60.39725 nsp_loss=0.06556 nsp_acc=97.544 throughput=151.0K tks/s lr=0.0000591 time=167.02 INFO:root:[step 408999] mlm_loss=1.60366 mlm_acc=65.57819 nsp_loss=0.03961 nsp_acc=98.575 throughput=131.0K tks/s lr=0.0000591 time=116.79 INFO:root:[step 409249] mlm_loss=1.76432 mlm_acc=62.25871 nsp_loss=0.09385 nsp_acc=96.221 throughput=154.0K tks/s lr=0.0000591 time=155.80 INFO:root:[step 409499] mlm_loss=1.75505 mlm_acc=62.17242 nsp_loss=0.06241 nsp_acc=97.557 throughput=138.0K tks/s lr=0.0000591 time=137.70 INFO:root:[step 409749] mlm_loss=1.56667 mlm_acc=66.27339 nsp_loss=0.03771 nsp_acc=98.676 throughput=127.0K tks/s lr=0.0000590 time=126.26 INFO:root:[step 409999] mlm_loss=1.55069 mlm_acc=66.10852 nsp_loss=0.04580 nsp_acc=98.371 throughput=129.0K tks/s lr=0.0000590 time=125.19 INFO:root:[step 409999] Saving checkpoints to /home/ubuntu/ckpt-master/0409999.params, /home/ubuntu/ckpt-master/0409999.states. INFO:root:[step 410249] mlm_loss=1.36361 mlm_acc=70.07187 nsp_loss=0.11329 nsp_acc=95.375 throughput=138.0K tks/s lr=0.0000590 time=157.81 INFO:root:[step 410499] mlm_loss=1.66425 mlm_acc=65.28182 nsp_loss=0.03651 nsp_acc=98.665 throughput=135.0K tks/s lr=0.0000590 time=129.52 INFO:root:[step 410749] mlm_loss=1.58588 mlm_acc=66.02160 nsp_loss=0.04121 nsp_acc=98.539 throughput=121.0K tks/s lr=0.0000589 time=122.92 INFO:root:[step 410999] mlm_loss=1.55197 mlm_acc=66.37316 nsp_loss=0.04061 nsp_acc=98.605 throughput=127.0K tks/s lr=0.0000589 time=112.03 INFO:root:[step 411249] mlm_loss=1.62479 mlm_acc=65.65196 nsp_loss=0.03803 nsp_acc=98.638 throughput=122.0K tks/s lr=0.0000589 time=125.57 INFO:root:[step 411499] mlm_loss=1.63296 mlm_acc=63.31087 nsp_loss=0.05074 nsp_acc=98.120 throughput=141.0K tks/s lr=0.0000589 time=134.37 INFO:root:[step 411749] mlm_loss=1.75427 mlm_acc=62.39514 nsp_loss=0.06559 nsp_acc=97.452 throughput=132.0K tks/s lr=0.0000588 time=118.72 INFO:root:[step 411999] mlm_loss=1.52815 mlm_acc=66.37299 nsp_loss=0.03913 nsp_acc=98.575 throughput=115.0K tks/s lr=0.0000588 time=116.53 INFO:root:[step 412249] mlm_loss=1.62306 mlm_acc=65.73291 nsp_loss=0.03846 nsp_acc=98.682 throughput=127.0K tks/s lr=0.0000588 time=118.71 INFO:root:[step 412499] mlm_loss=1.68572 mlm_acc=64.20596 nsp_loss=0.03635 nsp_acc=98.700 throughput=135.0K tks/s lr=0.0000588 time=133.60 INFO:root:[step 412749] mlm_loss=1.47415 mlm_acc=66.93224 nsp_loss=0.04306 nsp_acc=98.504 throughput=117.0K tks/s lr=0.0000587 time=113.13 INFO:root:[step 412999] mlm_loss=1.79259 mlm_acc=62.01670 nsp_loss=0.08911 nsp_acc=96.461 throughput=145.0K tks/s lr=0.0000587 time=162.74 INFO:root:[step 413249] mlm_loss=1.54425 mlm_acc=65.21966 nsp_loss=0.04725 nsp_acc=98.255 throughput=142.0K tks/s lr=0.0000587 time=122.04 INFO:root:[step 413499] mlm_loss=1.52195 mlm_acc=65.19221 nsp_loss=0.05839 nsp_acc=97.814 throughput=126.0K tks/s lr=0.0000587 time=123.97 INFO:root:[step 413749] mlm_loss=1.58980 mlm_acc=64.74150 nsp_loss=0.05293 nsp_acc=98.048 throughput=128.0K tks/s lr=0.0000586 time=133.32 INFO:root:[step 413999] mlm_loss=1.63218 mlm_acc=63.96286 nsp_loss=0.06005 nsp_acc=97.720 throughput=132.0K tks/s lr=0.0000586 time=113.51 INFO:root:[step 414249] mlm_loss=1.77409 mlm_acc=63.12395 nsp_loss=0.09410 nsp_acc=96.168 throughput=142.0K tks/s lr=0.0000586 time=145.56 INFO:root:[step 414499] mlm_loss=1.84674 mlm_acc=61.39611 nsp_loss=0.06531 nsp_acc=97.296 throughput=151.0K tks/s lr=0.0000586 time=147.86 INFO:root:[step 414749] mlm_loss=1.78914 mlm_acc=62.71568 nsp_loss=0.06340 nsp_acc=97.549 throughput=147.0K tks/s lr=0.0000585 time=146.41 INFO:root:[step 414999] mlm_loss=1.55128 mlm_acc=66.59093 nsp_loss=0.04128 nsp_acc=98.530 throughput=120.0K tks/s lr=0.0000585 time=121.53 INFO:root:[step 414999] Saving checkpoints to /home/ubuntu/ckpt-master/0414999.params, /home/ubuntu/ckpt-master/0414999.states. INFO:root:[step 415249] mlm_loss=1.45820 mlm_acc=67.30852 nsp_loss=0.04160 nsp_acc=98.556 throughput=105.0K tks/s lr=0.0000585 time=122.53 INFO:root:[step 415499] mlm_loss=1.48717 mlm_acc=67.05105 nsp_loss=0.03887 nsp_acc=98.607 throughput=119.0K tks/s lr=0.0000585 time=107.67 INFO:root:[step 415749] mlm_loss=1.47614 mlm_acc=66.61346 nsp_loss=0.03972 nsp_acc=98.569 throughput=112.0K tks/s lr=0.0000584 time=115.53 INFO:root:[step 415999] mlm_loss=1.51330 mlm_acc=66.07073 nsp_loss=0.04310 nsp_acc=98.385 throughput=124.0K tks/s lr=0.0000584 time=110.05 INFO:root:[step 416249] mlm_loss=1.77018 mlm_acc=64.02553 nsp_loss=0.03405 nsp_acc=98.762 throughput=145.0K tks/s lr=0.0000584 time=142.52 INFO:root:[step 416499] mlm_loss=1.77226 mlm_acc=63.74846 nsp_loss=0.03117 nsp_acc=98.928 throughput=148.0K tks/s lr=0.0000584 time=146.36 INFO:root:[step 416749] mlm_loss=1.63633 mlm_acc=65.43181 nsp_loss=0.04068 nsp_acc=98.503 throughput=127.0K tks/s lr=0.0000583 time=129.15 INFO:root:[step 416999] mlm_loss=1.70153 mlm_acc=63.84211 nsp_loss=0.04853 nsp_acc=98.176 throughput=141.0K tks/s lr=0.0000583 time=137.13 INFO:root:[step 417249] mlm_loss=1.86455 mlm_acc=61.32585 nsp_loss=0.07942 nsp_acc=96.815 throughput=140.0K tks/s lr=0.0000583 time=144.56 INFO:root:[step 417499] mlm_loss=1.55610 mlm_acc=66.01647 nsp_loss=0.04143 nsp_acc=98.472 throughput=127.0K tks/s lr=0.0000583 time=109.58 INFO:root:[step 417749] mlm_loss=1.63526 mlm_acc=64.78617 nsp_loss=0.05009 nsp_acc=98.155 throughput=137.0K tks/s lr=0.0000582 time=134.15 INFO:root:[step 417999] mlm_loss=1.50428 mlm_acc=66.21851 nsp_loss=0.04977 nsp_acc=98.223 throughput=120.0K tks/s lr=0.0000582 time=126.22 INFO:root:[step 418249] mlm_loss=1.65460 mlm_acc=63.57192 nsp_loss=0.06703 nsp_acc=97.380 throughput=144.0K tks/s lr=0.0000582 time=126.86 INFO:root:[step 418499] mlm_loss=1.69553 mlm_acc=64.63885 nsp_loss=0.03671 nsp_acc=98.675 throughput=135.0K tks/s lr=0.0000582 time=136.68 INFO:root:[step 418749] mlm_loss=1.52712 mlm_acc=66.58091 nsp_loss=0.04451 nsp_acc=98.438 throughput=112.0K tks/s lr=0.0000581 time=114.39 INFO:root:[step 418999] mlm_loss=1.79434 mlm_acc=62.75602 nsp_loss=0.04603 nsp_acc=98.288 throughput=145.0K tks/s lr=0.0000581 time=143.96 INFO:root:[step 419249] mlm_loss=1.64213 mlm_acc=63.38843 nsp_loss=0.04489 nsp_acc=98.336 throughput=146.0K tks/s lr=0.0000581 time=126.53 INFO:root:[step 419499] mlm_loss=1.88408 mlm_acc=60.20864 nsp_loss=0.05675 nsp_acc=97.879 throughput=148.0K tks/s lr=0.0000581 time=164.65 INFO:root:[step 419749] mlm_loss=1.64277 mlm_acc=64.38188 nsp_loss=0.10390 nsp_acc=95.653 throughput=140.0K tks/s lr=0.0000580 time=121.41 INFO:root:[step 419999] mlm_loss=1.63337 mlm_acc=65.23005 nsp_loss=0.03805 nsp_acc=98.631 throughput=127.0K tks/s lr=0.0000580 time=126.03 INFO:root:[step 419999] Saving checkpoints to /home/ubuntu/ckpt-master/0419999.params, /home/ubuntu/ckpt-master/0419999.states. INFO:root:[step 420249] mlm_loss=1.65590 mlm_acc=65.06960 nsp_loss=0.04462 nsp_acc=98.349 throughput=121.0K tks/s lr=0.0000580 time=148.26 INFO:root:[step 420499] mlm_loss=1.55750 mlm_acc=64.22210 nsp_loss=0.08719 nsp_acc=96.609 throughput=137.0K tks/s lr=0.0000580 time=137.51 INFO:root:[step 420749] mlm_loss=1.47863 mlm_acc=64.57831 nsp_loss=0.06711 nsp_acc=97.571 throughput=132.0K tks/s lr=0.0000579 time=114.87 INFO:root:[step 420999] mlm_loss=1.59604 mlm_acc=64.94013 nsp_loss=0.04843 nsp_acc=98.286 throughput=123.0K tks/s lr=0.0000579 time=123.24 INFO:root:[step 421249] mlm_loss=1.85470 mlm_acc=61.60475 nsp_loss=0.05372 nsp_acc=97.950 throughput=157.0K tks/s lr=0.0000579 time=157.33 INFO:root:[step 421499] mlm_loss=1.37692 mlm_acc=70.55228 nsp_loss=0.06388 nsp_acc=97.626 throughput=144.0K tks/s lr=0.0000579 time=147.61 INFO:root:[step 421749] mlm_loss=1.77297 mlm_acc=64.22453 nsp_loss=0.03085 nsp_acc=98.852 throughput=144.0K tks/s lr=0.0000578 time=140.37 INFO:root:[step 421999] mlm_loss=1.78137 mlm_acc=62.70623 nsp_loss=0.06420 nsp_acc=97.501 throughput=152.0K tks/s lr=0.0000578 time=172.03 INFO:root:[step 422249] mlm_loss=1.61998 mlm_acc=65.12015 nsp_loss=0.06859 nsp_acc=97.366 throughput=143.0K tks/s lr=0.0000578 time=145.18 INFO:root:[step 422499] mlm_loss=1.55157 mlm_acc=66.48202 nsp_loss=0.03609 nsp_acc=98.672 throughput=130.0K tks/s lr=0.0000578 time=113.25 INFO:root:[step 422749] mlm_loss=1.33343 mlm_acc=72.32324 nsp_loss=0.05751 nsp_acc=97.974 throughput=145.0K tks/s lr=0.0000577 time=143.35 INFO:root:[step 422999] mlm_loss=1.75517 mlm_acc=64.12362 nsp_loss=0.05083 nsp_acc=98.057 throughput=141.0K tks/s lr=0.0000577 time=138.42 INFO:root:[step 423249] mlm_loss=1.60392 mlm_acc=64.66593 nsp_loss=0.04999 nsp_acc=98.113 throughput=126.0K tks/s lr=0.0000577 time=125.55 INFO:root:[step 423499] mlm_loss=1.47728 mlm_acc=66.96659 nsp_loss=0.04450 nsp_acc=98.375 throughput=119.0K tks/s lr=0.0000577 time=108.28 INFO:root:[step 423749] mlm_loss=1.63274 mlm_acc=65.46625 nsp_loss=0.03718 nsp_acc=98.638 throughput=135.0K tks/s lr=0.0000576 time=118.78 INFO:root:[step 423999] mlm_loss=1.61287 mlm_acc=63.85817 nsp_loss=0.06667 nsp_acc=97.389 throughput=130.0K tks/s lr=0.0000576 time=135.13 INFO:root:[step 424249] mlm_loss=1.50341 mlm_acc=66.52833 nsp_loss=0.04494 nsp_acc=98.368 throughput=117.0K tks/s lr=0.0000576 time=108.39 INFO:root:[step 424749] mlm_loss=3.18970 mlm_acc=65.59981 nsp_loss=0.08095 nsp_acc=98.550 throughput=128.0K tks/s lr=0.0000575 time=254.27 INFO:root:[step 424999] mlm_loss=1.53687 mlm_acc=66.33032 nsp_loss=0.04408 nsp_acc=98.426 throughput=123.0K tks/s lr=0.0000575 time=111.18 INFO:root:[step 424999] Saving checkpoints to /home/ubuntu/ckpt-master/0424999.params, /home/ubuntu/ckpt-master/0424999.states. INFO:root:[step 425249] mlm_loss=1.49302 mlm_acc=66.86784 nsp_loss=0.04097 nsp_acc=98.520 throughput=105.0K tks/s lr=0.0000575 time=125.04 INFO:root:[step 425499] mlm_loss=1.60278 mlm_acc=64.91991 nsp_loss=0.04098 nsp_acc=98.566 throughput=131.0K tks/s lr=0.0000575 time=129.37 INFO:root:[step 425749] mlm_loss=1.67469 mlm_acc=64.99902 nsp_loss=0.03880 nsp_acc=98.592 throughput=137.0K tks/s lr=0.0000574 time=132.96 INFO:root:[step 425999] mlm_loss=1.68190 mlm_acc=64.80346 nsp_loss=0.07985 nsp_acc=96.798 throughput=143.0K tks/s lr=0.0000574 time=143.07 INFO:root:[step 426249] mlm_loss=1.69133 mlm_acc=65.25438 nsp_loss=0.03540 nsp_acc=98.694 throughput=136.0K tks/s lr=0.0000574 time=135.20 INFO:root:[step 426499] mlm_loss=1.72462 mlm_acc=64.16488 nsp_loss=0.04780 nsp_acc=98.169 throughput=144.0K tks/s lr=0.0000574 time=138.01 INFO:root:[step 426749] mlm_loss=1.72873 mlm_acc=64.23805 nsp_loss=0.04382 nsp_acc=98.305 throughput=141.0K tks/s lr=0.0000573 time=142.55 INFO:root:[step 426999] mlm_loss=1.54034 mlm_acc=66.24862 nsp_loss=0.04488 nsp_acc=98.341 throughput=125.0K tks/s lr=0.0000573 time=113.13 INFO:root:[step 427249] mlm_loss=1.67823 mlm_acc=65.12708 nsp_loss=0.03773 nsp_acc=98.640 throughput=133.0K tks/s lr=0.0000573 time=131.36 INFO:root:[step 427499] mlm_loss=1.73308 mlm_acc=64.92544 nsp_loss=0.03584 nsp_acc=98.730 throughput=138.0K tks/s lr=0.0000573 time=134.31 INFO:root:[step 427749] mlm_loss=1.61299 mlm_acc=65.81178 nsp_loss=0.03605 nsp_acc=98.663 throughput=135.0K tks/s lr=0.0000572 time=117.72 INFO:root:[step 427999] mlm_loss=1.64141 mlm_acc=64.51014 nsp_loss=0.06248 nsp_acc=97.554 throughput=143.0K tks/s lr=0.0000572 time=139.41 INFO:root:[step 428249] mlm_loss=1.83800 mlm_acc=61.66015 nsp_loss=0.08828 nsp_acc=96.486 throughput=153.0K tks/s lr=0.0000572 time=168.45 INFO:root:[step 428499] mlm_loss=1.78055 mlm_acc=64.26084 nsp_loss=0.03691 nsp_acc=98.612 throughput=144.0K tks/s lr=0.0000572 time=137.09 INFO:root:[step 428749] mlm_loss=1.74669 mlm_acc=64.46725 nsp_loss=0.03440 nsp_acc=98.768 throughput=141.0K tks/s lr=0.0000571 time=141.05 INFO:root:[step 428999] mlm_loss=1.76158 mlm_acc=64.39253 nsp_loss=0.03138 nsp_acc=98.864 throughput=144.0K tks/s lr=0.0000571 time=138.72 INFO:root:[step 429249] mlm_loss=1.79573 mlm_acc=63.36433 nsp_loss=0.06298 nsp_acc=97.421 throughput=150.0K tks/s lr=0.0000571 time=148.48 INFO:root:[step 429499] mlm_loss=1.46799 mlm_acc=66.68692 nsp_loss=0.04544 nsp_acc=98.329 throughput=124.0K tks/s lr=0.0000571 time=110.78 INFO:root:[step 429749] mlm_loss=1.78433 mlm_acc=63.84173 nsp_loss=0.03140 nsp_acc=98.872 throughput=145.0K tks/s lr=0.0000570 time=152.86 INFO:root:[step 429999] mlm_loss=1.82555 mlm_acc=62.23851 nsp_loss=0.07632 nsp_acc=96.987 throughput=157.0K tks/s lr=0.0000570 time=161.09 INFO:root:[step 429999] Saving checkpoints to /home/ubuntu/ckpt-master/0429999.params, /home/ubuntu/ckpt-master/0429999.states. INFO:root:[step 430249] mlm_loss=1.57596 mlm_acc=65.55399 nsp_loss=0.05442 nsp_acc=97.973 throughput=110.0K tks/s lr=0.0000570 time=142.04 INFO:root:[step 430499] mlm_loss=1.57913 mlm_acc=66.19937 nsp_loss=0.03675 nsp_acc=98.676 throughput=134.0K tks/s lr=0.0000570 time=115.62 INFO:root:[step 430749] mlm_loss=1.49444 mlm_acc=67.00734 nsp_loss=0.03979 nsp_acc=98.641 throughput=110.0K tks/s lr=0.0000569 time=118.84 INFO:root:[step 430999] mlm_loss=1.52908 mlm_acc=65.62689 nsp_loss=0.05585 nsp_acc=97.838 throughput=138.0K tks/s lr=0.0000569 time=118.48 INFO:root:[step 431249] mlm_loss=1.70800 mlm_acc=63.80310 nsp_loss=0.10752 nsp_acc=95.378 throughput=144.0K tks/s lr=0.0000569 time=145.50 INFO:root:[step 431499] mlm_loss=1.68785 mlm_acc=65.13975 nsp_loss=0.03388 nsp_acc=98.761 throughput=130.0K tks/s lr=0.0000569 time=130.72 INFO:root:[step 431749] mlm_loss=1.52853 mlm_acc=66.69451 nsp_loss=0.04139 nsp_acc=98.537 throughput=120.0K tks/s lr=0.0000568 time=110.18 INFO:root:[step 431999] mlm_loss=1.68723 mlm_acc=65.11400 nsp_loss=0.03722 nsp_acc=98.670 throughput=137.0K tks/s lr=0.0000568 time=130.97 INFO:root:[step 432249] mlm_loss=1.91701 mlm_acc=61.25233 nsp_loss=0.06104 nsp_acc=97.644 throughput=156.0K tks/s lr=0.0000568 time=158.11 INFO:root:[step 432499] mlm_loss=1.67492 mlm_acc=64.81482 nsp_loss=0.04071 nsp_acc=98.516 throughput=132.0K tks/s lr=0.0000568 time=128.62 INFO:root:[step 432749] mlm_loss=1.65911 mlm_acc=64.92541 nsp_loss=0.03650 nsp_acc=98.658 throughput=135.0K tks/s lr=0.0000567 time=132.44 INFO:root:[step 432999] mlm_loss=1.58622 mlm_acc=65.96743 nsp_loss=0.03769 nsp_acc=98.607 throughput=131.0K tks/s lr=0.0000567 time=113.64 INFO:root:[step 433249] mlm_loss=1.72451 mlm_acc=64.79187 nsp_loss=0.03575 nsp_acc=98.711 throughput=140.0K tks/s lr=0.0000567 time=136.95 INFO:root:[step 433499] mlm_loss=1.71023 mlm_acc=64.07112 nsp_loss=0.05521 nsp_acc=97.893 throughput=147.0K tks/s lr=0.0000567 time=146.53 INFO:root:[step 433749] mlm_loss=1.43651 mlm_acc=67.40247 nsp_loss=0.04433 nsp_acc=98.444 throughput=110.0K tks/s lr=0.0000566 time=117.54 INFO:root:[step 433999] mlm_loss=1.57265 mlm_acc=65.77780 nsp_loss=0.04205 nsp_acc=98.483 throughput=130.0K tks/s lr=0.0000566 time=114.32 INFO:root:[step 434249] mlm_loss=1.67893 mlm_acc=64.95320 nsp_loss=0.03386 nsp_acc=98.750 throughput=134.0K tks/s lr=0.0000566 time=134.25 INFO:root:[step 434499] mlm_loss=1.48303 mlm_acc=66.82329 nsp_loss=0.05184 nsp_acc=98.057 throughput=111.0K tks/s lr=0.0000566 time=106.33 INFO:root:[step 434749] mlm_loss=1.52640 mlm_acc=66.17705 nsp_loss=0.04366 nsp_acc=98.379 throughput=115.0K tks/s lr=0.0000565 time=119.00 INFO:root:[step 434999] mlm_loss=1.51332 mlm_acc=66.72316 nsp_loss=0.03902 nsp_acc=98.612 throughput=122.0K tks/s lr=0.0000565 time=109.90 INFO:root:[step 434999] Saving checkpoints to /home/ubuntu/ckpt-master/0434999.params, /home/ubuntu/ckpt-master/0434999.states. INFO:root:[step 435249] mlm_loss=1.47772 mlm_acc=67.28360 nsp_loss=0.04054 nsp_acc=98.567 throughput=100.0K tks/s lr=0.0000565 time=120.68 INFO:root:[step 435499] mlm_loss=1.58984 mlm_acc=64.53629 nsp_loss=0.07274 nsp_acc=97.148 throughput=135.0K tks/s lr=0.0000565 time=137.04 INFO:root:[step 435749] mlm_loss=1.43645 mlm_acc=67.49016 nsp_loss=0.04246 nsp_acc=98.533 throughput=115.0K tks/s lr=0.0000564 time=106.49 INFO:root:[step 435999] mlm_loss=1.53398 mlm_acc=66.40049 nsp_loss=0.04190 nsp_acc=98.529 throughput=123.0K tks/s lr=0.0000564 time=110.35 INFO:root:[step 436249] mlm_loss=1.46077 mlm_acc=67.38096 nsp_loss=0.04114 nsp_acc=98.537 throughput=110.0K tks/s lr=0.0000564 time=115.56 INFO:root:[step 436499] mlm_loss=1.53950 mlm_acc=66.53365 nsp_loss=0.04159 nsp_acc=98.481 throughput=121.0K tks/s lr=0.0000564 time=111.03 INFO:root:[step 436749] mlm_loss=1.48319 mlm_acc=67.14824 nsp_loss=0.04309 nsp_acc=98.437 throughput=117.0K tks/s lr=0.0000563 time=105.44 INFO:root:[step 436999] mlm_loss=1.95172 mlm_acc=60.72308 nsp_loss=0.07808 nsp_acc=96.892 throughput=126.0K tks/s lr=0.0000563 time=129.47 INFO:root:[step 437249] mlm_loss=1.76309 mlm_acc=62.93749 nsp_loss=0.06538 nsp_acc=97.445 throughput=144.0K tks/s lr=0.0000563 time=146.60 INFO:root:[step 437499] mlm_loss=1.68146 mlm_acc=64.50987 nsp_loss=0.07891 nsp_acc=96.774 throughput=140.0K tks/s lr=0.0000563 time=137.84 INFO:root:[step 437749] mlm_loss=1.67754 mlm_acc=65.11349 nsp_loss=0.03690 nsp_acc=98.654 throughput=138.0K tks/s lr=0.0000562 time=121.65 INFO:root:[step 437999] mlm_loss=1.71471 mlm_acc=64.24689 nsp_loss=0.08218 nsp_acc=96.601 throughput=136.0K tks/s lr=0.0000562 time=133.64 INFO:root:[step 438249] mlm_loss=1.63623 mlm_acc=65.29802 nsp_loss=0.05880 nsp_acc=97.622 throughput=129.0K tks/s lr=0.0000562 time=129.47 INFO:root:[step 438499] mlm_loss=1.67802 mlm_acc=64.83664 nsp_loss=0.03362 nsp_acc=98.773 throughput=134.0K tks/s lr=0.0000562 time=131.79 INFO:root:[step 438749] mlm_loss=1.76256 mlm_acc=63.39323 nsp_loss=0.05990 nsp_acc=97.686 throughput=147.0K tks/s lr=0.0000561 time=142.22 INFO:root:[step 438999] mlm_loss=1.79252 mlm_acc=62.65099 nsp_loss=0.07188 nsp_acc=97.096 throughput=155.0K tks/s lr=0.0000561 time=161.73 INFO:root:[step 439249] mlm_loss=1.59969 mlm_acc=65.81893 nsp_loss=0.04175 nsp_acc=98.484 throughput=131.0K tks/s lr=0.0000561 time=113.79 INFO:root:[step 439499] mlm_loss=1.85317 mlm_acc=62.38438 nsp_loss=0.05897 nsp_acc=97.648 throughput=138.0K tks/s lr=0.0000561 time=144.64 INFO:root:[step 439749] mlm_loss=1.74182 mlm_acc=64.54840 nsp_loss=0.03426 nsp_acc=98.722 throughput=140.0K tks/s lr=0.0000560 time=142.28 INFO:root:[step 439999] mlm_loss=1.56589 mlm_acc=65.13248 nsp_loss=0.06721 nsp_acc=97.349 throughput=135.0K tks/s lr=0.0000560 time=114.85 INFO:root:[step 439999] Saving checkpoints to /home/ubuntu/ckpt-master/0439999.params, /home/ubuntu/ckpt-master/0439999.states. INFO:root:[step 440249] mlm_loss=1.68258 mlm_acc=64.14726 nsp_loss=0.05229 nsp_acc=97.950 throughput=124.0K tks/s lr=0.0000560 time=153.83 INFO:root:[step 440499] mlm_loss=1.65957 mlm_acc=64.87795 nsp_loss=0.03583 nsp_acc=98.706 throughput=135.0K tks/s lr=0.0000560 time=133.15 INFO:root:[step 440749] mlm_loss=1.65950 mlm_acc=64.54300 nsp_loss=0.07298 nsp_acc=97.128 throughput=142.0K tks/s lr=0.0000559 time=143.48 INFO:root:[step 440999] mlm_loss=1.56003 mlm_acc=66.04035 nsp_loss=0.04143 nsp_acc=98.517 throughput=127.0K tks/s lr=0.0000559 time=114.79 INFO:root:[step 441249] mlm_loss=1.78622 mlm_acc=62.85181 nsp_loss=0.04398 nsp_acc=98.410 throughput=146.0K tks/s lr=0.0000559 time=145.38 INFO:root:[step 441499] mlm_loss=1.53448 mlm_acc=66.15433 nsp_loss=0.04446 nsp_acc=98.401 throughput=119.0K tks/s lr=0.0000559 time=120.91 INFO:root:[step 441749] mlm_loss=1.61035 mlm_acc=65.66730 nsp_loss=0.03852 nsp_acc=98.633 throughput=134.0K tks/s lr=0.0000558 time=118.80 INFO:root:[step 441999] mlm_loss=1.42335 mlm_acc=67.42454 nsp_loss=0.04365 nsp_acc=98.415 throughput=111.0K tks/s lr=0.0000558 time=114.19 INFO:root:[step 442249] mlm_loss=1.75092 mlm_acc=64.27726 nsp_loss=0.04924 nsp_acc=98.127 throughput=144.0K tks/s lr=0.0000558 time=140.86 INFO:root:[step 442499] mlm_loss=1.67797 mlm_acc=64.69224 nsp_loss=0.08504 nsp_acc=96.418 throughput=138.0K tks/s lr=0.0000558 time=138.09 INFO:root:[step 442749] mlm_loss=1.56086 mlm_acc=66.33393 nsp_loss=0.03995 nsp_acc=98.577 throughput=128.0K tks/s lr=0.0000557 time=115.83 INFO:root:[step 442999] mlm_loss=1.47582 mlm_acc=67.00106 nsp_loss=0.04192 nsp_acc=98.477 throughput=123.0K tks/s lr=0.0000557 time=110.82 INFO:root:[step 443249] mlm_loss=1.58265 mlm_acc=65.80908 nsp_loss=0.03639 nsp_acc=98.681 throughput=125.0K tks/s lr=0.0000557 time=124.90 INFO:root:[step 443499] mlm_loss=1.58355 mlm_acc=65.64832 nsp_loss=0.03608 nsp_acc=98.747 throughput=125.0K tks/s lr=0.0000557 time=127.85 INFO:root:[step 443749] mlm_loss=1.58214 mlm_acc=64.64274 nsp_loss=0.05735 nsp_acc=97.893 throughput=143.0K tks/s lr=0.0000556 time=126.29 INFO:root:[step 443999] mlm_loss=1.70210 mlm_acc=65.23413 nsp_loss=0.03484 nsp_acc=98.676 throughput=144.0K tks/s lr=0.0000556 time=154.91 INFO:root:[step 444249] mlm_loss=1.63678 mlm_acc=65.67048 nsp_loss=0.03852 nsp_acc=98.590 throughput=136.0K tks/s lr=0.0000556 time=120.45 INFO:root:[step 444499] mlm_loss=1.63835 mlm_acc=65.57850 nsp_loss=0.06274 nsp_acc=97.520 throughput=126.0K tks/s lr=0.0000556 time=124.56 INFO:root:[step 444749] mlm_loss=1.80001 mlm_acc=63.11567 nsp_loss=0.09226 nsp_acc=96.005 throughput=147.0K tks/s lr=0.0000555 time=148.04 INFO:root:[step 444999] mlm_loss=1.71310 mlm_acc=64.15611 nsp_loss=0.04096 nsp_acc=98.497 throughput=141.0K tks/s lr=0.0000555 time=143.24 INFO:root:[step 444999] Saving checkpoints to /home/ubuntu/ckpt-master/0444999.params, /home/ubuntu/ckpt-master/0444999.states. INFO:root:[step 445249] mlm_loss=1.63966 mlm_acc=64.52463 nsp_loss=0.07095 nsp_acc=97.259 throughput=130.0K tks/s lr=0.0000555 time=156.07 INFO:root:[step 445499] mlm_loss=1.72369 mlm_acc=64.82741 nsp_loss=0.03195 nsp_acc=98.823 throughput=147.0K tks/s lr=0.0000555 time=145.87 INFO:root:[step 445749] mlm_loss=1.64928 mlm_acc=65.06074 nsp_loss=0.03457 nsp_acc=98.748 throughput=133.0K tks/s lr=0.0000554 time=134.07 INFO:root:[step 445999] mlm_loss=1.60304 mlm_acc=65.72986 nsp_loss=0.03729 nsp_acc=98.660 throughput=128.0K tks/s lr=0.0000554 time=125.47 INFO:root:[step 446249] mlm_loss=1.50692 mlm_acc=66.65520 nsp_loss=0.04487 nsp_acc=98.369 throughput=124.0K tks/s lr=0.0000554 time=109.21 INFO:root:[step 446499] mlm_loss=1.51782 mlm_acc=67.03910 nsp_loss=0.04049 nsp_acc=98.507 throughput=125.0K tks/s lr=0.0000554 time=110.53 INFO:root:[step 446749] mlm_loss=1.60772 mlm_acc=65.98234 nsp_loss=0.04072 nsp_acc=98.550 throughput=121.0K tks/s lr=0.0000553 time=123.88 INFO:root:[step 446999] mlm_loss=1.49782 mlm_acc=66.99958 nsp_loss=0.04313 nsp_acc=98.464 throughput=120.0K tks/s lr=0.0000553 time=107.26 INFO:root:[step 447249] mlm_loss=1.48078 mlm_acc=67.08514 nsp_loss=0.03883 nsp_acc=98.674 throughput=125.0K tks/s lr=0.0000553 time=111.05 INFO:root:[step 447499] mlm_loss=1.79788 mlm_acc=62.67813 nsp_loss=0.06089 nsp_acc=97.588 throughput=147.0K tks/s lr=0.0000553 time=157.34 INFO:root:[step 447749] mlm_loss=1.68923 mlm_acc=64.03027 nsp_loss=0.04330 nsp_acc=98.365 throughput=142.0K tks/s lr=0.0000552 time=143.80 INFO:root:[step 447999] mlm_loss=1.70048 mlm_acc=65.21564 nsp_loss=0.03657 nsp_acc=98.657 throughput=139.0K tks/s lr=0.0000552 time=133.07 INFO:root:[step 448249] mlm_loss=1.72946 mlm_acc=62.42804 nsp_loss=0.11983 nsp_acc=94.896 throughput=149.0K tks/s lr=0.0000552 time=161.07 INFO:root:[step 448499] mlm_loss=1.58437 mlm_acc=63.57388 nsp_loss=0.08730 nsp_acc=96.588 throughput=132.0K tks/s lr=0.0000552 time=116.27 INFO:root:[step 448749] mlm_loss=1.67306 mlm_acc=64.52539 nsp_loss=0.04607 nsp_acc=98.212 throughput=128.0K tks/s lr=0.0000551 time=130.60 INFO:root:[step 448999] mlm_loss=1.46096 mlm_acc=66.94881 nsp_loss=0.04654 nsp_acc=98.319 throughput=116.0K tks/s lr=0.0000551 time=107.02 INFO:root:[step 449249] mlm_loss=1.73484 mlm_acc=63.83368 nsp_loss=0.05056 nsp_acc=97.993 throughput=142.0K tks/s lr=0.0000551 time=138.54 INFO:root:[step 449499] mlm_loss=1.80601 mlm_acc=62.82081 nsp_loss=0.05456 nsp_acc=97.804 throughput=145.0K tks/s lr=0.0000551 time=143.66 INFO:root:[step 449749] mlm_loss=1.60151 mlm_acc=64.96710 nsp_loss=0.04621 nsp_acc=98.275 throughput=121.0K tks/s lr=0.0000550 time=125.57 INFO:root:[step 449999] mlm_loss=1.72094 mlm_acc=63.21038 nsp_loss=0.07490 nsp_acc=97.084 throughput=141.0K tks/s lr=0.0000550 time=133.50 INFO:root:[step 449999] Saving checkpoints to /home/ubuntu/ckpt-master/0449999.params, /home/ubuntu/ckpt-master/0449999.states. INFO:root:[step 450249] mlm_loss=1.70806 mlm_acc=63.17753 nsp_loss=0.04807 nsp_acc=98.228 throughput=129.0K tks/s lr=0.0000550 time=155.46 INFO:root:[step 450499] mlm_loss=1.72520 mlm_acc=64.01296 nsp_loss=0.05582 nsp_acc=97.856 throughput=152.0K tks/s lr=0.0000550 time=154.80 INFO:root:[step 450749] mlm_loss=1.65717 mlm_acc=65.66489 nsp_loss=0.03612 nsp_acc=98.669 throughput=131.0K tks/s lr=0.0000549 time=130.26 INFO:root:[step 450999] mlm_loss=1.56915 mlm_acc=66.41288 nsp_loss=0.03923 nsp_acc=98.542 throughput=133.0K tks/s lr=0.0000549 time=116.64 INFO:root:[step 451249] mlm_loss=1.59466 mlm_acc=65.38935 nsp_loss=0.03963 nsp_acc=98.548 throughput=135.0K tks/s lr=0.0000549 time=133.40 INFO:root:[step 451499] mlm_loss=1.50176 mlm_acc=66.87928 nsp_loss=0.04489 nsp_acc=98.441 throughput=129.0K tks/s lr=0.0000549 time=112.62 INFO:root:[step 451749] mlm_loss=1.53750 mlm_acc=65.79696 nsp_loss=0.05066 nsp_acc=98.139 throughput=126.0K tks/s lr=0.0000548 time=125.42 INFO:root:[step 451999] mlm_loss=1.72875 mlm_acc=64.19084 nsp_loss=0.04886 nsp_acc=98.153 throughput=145.0K tks/s lr=0.0000548 time=144.79 INFO:root:[step 452249] mlm_loss=1.58608 mlm_acc=65.43103 nsp_loss=0.04865 nsp_acc=98.156 throughput=131.0K tks/s lr=0.0000548 time=127.40 INFO:root:[step 452499] mlm_loss=1.71064 mlm_acc=63.81036 nsp_loss=0.07441 nsp_acc=97.009 throughput=145.0K tks/s lr=0.0000548 time=147.30 INFO:root:[step 452749] mlm_loss=1.58252 mlm_acc=66.02007 nsp_loss=0.04339 nsp_acc=98.427 throughput=130.0K tks/s lr=0.0000547 time=114.79 INFO:root:[step 453249] mlm_loss=3.29584 mlm_acc=65.45850 nsp_loss=0.07119 nsp_acc=98.719 throughput=133.0K tks/s lr=0.0000547 time=261.88 INFO:root:[step 453499] mlm_loss=1.54277 mlm_acc=65.32246 nsp_loss=0.06615 nsp_acc=97.461 throughput=145.0K tks/s lr=0.0000547 time=139.45 INFO:root:[step 453749] mlm_loss=1.65447 mlm_acc=65.15859 nsp_loss=0.03575 nsp_acc=98.692 throughput=130.0K tks/s lr=0.0000546 time=139.21 INFO:root:[step 453999] mlm_loss=1.47772 mlm_acc=67.18688 nsp_loss=0.04188 nsp_acc=98.543 throughput=118.0K tks/s lr=0.0000546 time=108.16 INFO:root:[step 454249] mlm_loss=1.65272 mlm_acc=65.05674 nsp_loss=0.03374 nsp_acc=98.764 throughput=139.0K tks/s lr=0.0000546 time=132.40 INFO:root:[step 454499] mlm_loss=1.97763 mlm_acc=61.02319 nsp_loss=0.07426 nsp_acc=97.039 throughput=144.0K tks/s lr=0.0000546 time=140.41 INFO:root:[step 454749] mlm_loss=1.78440 mlm_acc=63.26582 nsp_loss=0.04368 nsp_acc=98.368 throughput=152.0K tks/s lr=0.0000545 time=153.67 INFO:root:[step 454999] mlm_loss=1.69872 mlm_acc=62.63216 nsp_loss=0.07316 nsp_acc=97.065 throughput=136.0K tks/s lr=0.0000545 time=139.95 INFO:root:[step 454999] Saving checkpoints to /home/ubuntu/ckpt-master/0454999.params, /home/ubuntu/ckpt-master/0454999.states. INFO:root:[step 455249] mlm_loss=1.50827 mlm_acc=66.83402 nsp_loss=0.04302 nsp_acc=98.462 throughput=106.0K tks/s lr=0.0000545 time=125.28 INFO:root:[step 455499] mlm_loss=1.64426 mlm_acc=65.32321 nsp_loss=0.03873 nsp_acc=98.546 throughput=133.0K tks/s lr=0.0000545 time=129.55 INFO:root:[step 455749] mlm_loss=1.48755 mlm_acc=67.14944 nsp_loss=0.04253 nsp_acc=98.453 throughput=121.0K tks/s lr=0.0000544 time=110.42 INFO:root:[step 455999] mlm_loss=1.73694 mlm_acc=63.37102 nsp_loss=0.09316 nsp_acc=96.296 throughput=147.0K tks/s lr=0.0000544 time=165.76 INFO:root:[step 456249] mlm_loss=1.65109 mlm_acc=64.89856 nsp_loss=0.03705 nsp_acc=98.681 throughput=135.0K tks/s lr=0.0000544 time=128.58 INFO:root:[step 456499] mlm_loss=1.59249 mlm_acc=65.43954 nsp_loss=0.04172 nsp_acc=98.502 throughput=132.0K tks/s lr=0.0000544 time=123.98 INFO:root:[step 456749] mlm_loss=1.60200 mlm_acc=64.91271 nsp_loss=0.12367 nsp_acc=94.697 throughput=126.0K tks/s lr=0.0000543 time=132.13 INFO:root:[step 456999] mlm_loss=1.59337 mlm_acc=65.36865 nsp_loss=0.03846 nsp_acc=98.621 throughput=140.0K tks/s lr=0.0000543 time=118.37 INFO:root:[step 457249] mlm_loss=1.35413 mlm_acc=67.79788 nsp_loss=0.04962 nsp_acc=98.231 throughput=106.0K tks/s lr=0.0000543 time=113.35 INFO:root:[step 457499] mlm_loss=1.66574 mlm_acc=64.80219 nsp_loss=0.04176 nsp_acc=98.441 throughput=141.0K tks/s lr=0.0000543 time=134.72 INFO:root:[step 457749] mlm_loss=1.57705 mlm_acc=65.42222 nsp_loss=0.08133 nsp_acc=96.725 throughput=135.0K tks/s lr=0.0000542 time=123.01 INFO:root:[step 457999] mlm_loss=1.67731 mlm_acc=65.23109 nsp_loss=0.03735 nsp_acc=98.660 throughput=134.0K tks/s lr=0.0000542 time=129.63 INFO:root:[step 458249] mlm_loss=1.62527 mlm_acc=65.61440 nsp_loss=0.04005 nsp_acc=98.562 throughput=125.0K tks/s lr=0.0000542 time=127.25 INFO:root:[step 458499] mlm_loss=1.54587 mlm_acc=66.22471 nsp_loss=0.04197 nsp_acc=98.491 throughput=133.0K tks/s lr=0.0000542 time=113.55 INFO:root:[step 458749] mlm_loss=1.88095 mlm_acc=61.58819 nsp_loss=0.08452 nsp_acc=96.548 throughput=136.0K tks/s lr=0.0000541 time=136.75 INFO:root:[step 458999] mlm_loss=1.48342 mlm_acc=67.09557 nsp_loss=0.04484 nsp_acc=98.410 throughput=124.0K tks/s lr=0.0000541 time=110.46 INFO:root:[step 459249] mlm_loss=1.81735 mlm_acc=62.56817 nsp_loss=0.04436 nsp_acc=98.317 throughput=148.0K tks/s lr=0.0000541 time=160.05 INFO:root:[step 459499] mlm_loss=1.66444 mlm_acc=65.29722 nsp_loss=0.02479 nsp_acc=99.109 throughput=141.0K tks/s lr=0.0000541 time=134.16 INFO:root:[step 459749] mlm_loss=1.70633 mlm_acc=64.87708 nsp_loss=0.02463 nsp_acc=99.108 throughput=144.0K tks/s lr=0.0000540 time=139.03 INFO:root:[step 459999] mlm_loss=1.61955 mlm_acc=66.22615 nsp_loss=0.02791 nsp_acc=99.035 throughput=138.0K tks/s lr=0.0000540 time=139.16 INFO:root:[step 459999] Saving checkpoints to /home/ubuntu/ckpt-master/0459999.params, /home/ubuntu/ckpt-master/0459999.states. INFO:root:[step 460249] mlm_loss=1.57973 mlm_acc=65.13035 nsp_loss=0.04054 nsp_acc=98.466 throughput=125.0K tks/s lr=0.0000540 time=153.25 INFO:root:[step 460499] mlm_loss=1.46567 mlm_acc=67.40407 nsp_loss=0.03420 nsp_acc=98.781 throughput=119.0K tks/s lr=0.0000540 time=109.09 INFO:root:[step 460749] mlm_loss=1.51828 mlm_acc=67.03535 nsp_loss=0.03175 nsp_acc=98.905 throughput=132.0K tks/s lr=0.0000539 time=113.31 INFO:root:[step 460999] mlm_loss=1.68764 mlm_acc=64.24635 nsp_loss=0.05427 nsp_acc=97.932 throughput=140.0K tks/s lr=0.0000539 time=158.10 INFO:root:[step 461249] mlm_loss=1.41360 mlm_acc=67.47634 nsp_loss=0.03690 nsp_acc=98.746 throughput=119.0K tks/s lr=0.0000539 time=106.60 INFO:root:[step 461499] mlm_loss=1.64585 mlm_acc=63.84555 nsp_loss=0.06111 nsp_acc=97.695 throughput=139.0K tks/s lr=0.0000539 time=139.49 INFO:root:[step 461749] mlm_loss=1.62321 mlm_acc=63.24529 nsp_loss=0.04485 nsp_acc=98.289 throughput=137.0K tks/s lr=0.0000538 time=134.42 INFO:root:[step 461999] mlm_loss=1.47681 mlm_acc=66.55974 nsp_loss=0.03011 nsp_acc=98.937 throughput=135.0K tks/s lr=0.0000538 time=113.74 INFO:root:[step 462249] mlm_loss=1.73654 mlm_acc=63.21069 nsp_loss=0.06179 nsp_acc=97.556 throughput=153.0K tks/s lr=0.0000538 time=172.61 INFO:root:[step 462499] mlm_loss=1.53928 mlm_acc=65.66862 nsp_loss=0.05548 nsp_acc=97.895 throughput=144.0K tks/s lr=0.0000538 time=129.15 INFO:root:[step 462749] mlm_loss=1.64946 mlm_acc=65.33786 nsp_loss=0.03678 nsp_acc=98.683 throughput=131.0K tks/s lr=0.0000537 time=130.09 INFO:root:[step 462999] mlm_loss=1.55531 mlm_acc=66.51361 nsp_loss=0.03177 nsp_acc=98.889 throughput=126.0K tks/s lr=0.0000537 time=124.02 INFO:root:[step 463249] mlm_loss=1.53269 mlm_acc=66.93718 nsp_loss=0.03490 nsp_acc=98.721 throughput=131.0K tks/s lr=0.0000537 time=117.32 INFO:root:[step 463499] mlm_loss=1.64508 mlm_acc=64.80758 nsp_loss=0.02925 nsp_acc=98.977 throughput=137.0K tks/s lr=0.0000537 time=136.46 INFO:root:[step 463749] mlm_loss=1.55062 mlm_acc=66.27136 nsp_loss=0.03397 nsp_acc=98.830 throughput=122.0K tks/s lr=0.0000536 time=122.07 INFO:root:[step 463999] mlm_loss=1.71456 mlm_acc=63.83828 nsp_loss=0.08452 nsp_acc=96.484 throughput=140.0K tks/s lr=0.0000536 time=144.23 INFO:root:[step 464249] mlm_loss=1.46791 mlm_acc=67.27363 nsp_loss=0.03579 nsp_acc=98.750 throughput=124.0K tks/s lr=0.0000536 time=109.88 INFO:root:[step 464499] mlm_loss=1.60336 mlm_acc=65.72141 nsp_loss=0.02749 nsp_acc=99.041 throughput=133.0K tks/s lr=0.0000536 time=128.63 INFO:root:[step 464749] mlm_loss=1.70950 mlm_acc=63.49382 nsp_loss=0.05885 nsp_acc=97.689 throughput=140.0K tks/s lr=0.0000535 time=140.29 INFO:root:[step 464999] mlm_loss=1.57665 mlm_acc=66.24211 nsp_loss=0.03350 nsp_acc=98.811 throughput=135.0K tks/s lr=0.0000535 time=116.96 INFO:root:[step 464999] Saving checkpoints to /home/ubuntu/ckpt-master/0464999.params, /home/ubuntu/ckpt-master/0464999.states. INFO:root:[step 465249] mlm_loss=1.80605 mlm_acc=62.90869 nsp_loss=0.05132 nsp_acc=98.045 throughput=136.0K tks/s lr=0.0000535 time=171.98 INFO:root:[step 465499] mlm_loss=1.73841 mlm_acc=62.68601 nsp_loss=0.06648 nsp_acc=97.379 throughput=154.0K tks/s lr=0.0000535 time=163.62 INFO:root:[step 465749] mlm_loss=1.48608 mlm_acc=66.90297 nsp_loss=0.03944 nsp_acc=98.593 throughput=124.0K tks/s lr=0.0000534 time=109.72 INFO:root:[step 465999] mlm_loss=1.44676 mlm_acc=67.45502 nsp_loss=0.03198 nsp_acc=98.896 throughput=113.0K tks/s lr=0.0000534 time=115.68 INFO:root:[step 466249] mlm_loss=1.68974 mlm_acc=65.18421 nsp_loss=0.02962 nsp_acc=98.949 throughput=147.0K tks/s lr=0.0000534 time=127.95 INFO:root:[step 466499] mlm_loss=1.60194 mlm_acc=65.84007 nsp_loss=0.03272 nsp_acc=98.852 throughput=124.0K tks/s lr=0.0000534 time=127.12 INFO:root:[step 466749] mlm_loss=1.55918 mlm_acc=65.18952 nsp_loss=0.05470 nsp_acc=97.900 throughput=139.0K tks/s lr=0.0000533 time=140.27 INFO:root:[step 466999] mlm_loss=1.56943 mlm_acc=66.20794 nsp_loss=0.03096 nsp_acc=98.944 throughput=134.0K tks/s lr=0.0000533 time=115.28 INFO:root:[step 467249] mlm_loss=1.71888 mlm_acc=64.67763 nsp_loss=0.02628 nsp_acc=99.082 throughput=135.0K tks/s lr=0.0000533 time=147.63 INFO:root:[step 467499] mlm_loss=1.46488 mlm_acc=66.90268 nsp_loss=0.04366 nsp_acc=98.427 throughput=119.0K tks/s lr=0.0000533 time=111.04 INFO:root:[step 467749] mlm_loss=1.38095 mlm_acc=67.55949 nsp_loss=0.04238 nsp_acc=98.502 throughput=119.0K tks/s lr=0.0000532 time=110.18 INFO:root:[step 467999] mlm_loss=1.62872 mlm_acc=65.77537 nsp_loss=0.03506 nsp_acc=98.725 throughput=130.0K tks/s lr=0.0000532 time=125.18 INFO:root:[step 468249] mlm_loss=1.51967 mlm_acc=66.49130 nsp_loss=0.03523 nsp_acc=98.742 throughput=129.0K tks/s lr=0.0000532 time=118.86 INFO:root:[step 468499] mlm_loss=1.46279 mlm_acc=67.30841 nsp_loss=0.03558 nsp_acc=98.744 throughput=114.0K tks/s lr=0.0000532 time=118.00 INFO:root:[step 468749] mlm_loss=1.45719 mlm_acc=67.71001 nsp_loss=0.03973 nsp_acc=98.617 throughput=116.0K tks/s lr=0.0000531 time=105.39 INFO:root:[step 468999] mlm_loss=1.47674 mlm_acc=67.14356 nsp_loss=0.03442 nsp_acc=98.787 throughput=126.0K tks/s lr=0.0000531 time=111.04 INFO:root:[step 469249] mlm_loss=1.53842 mlm_acc=66.50142 nsp_loss=0.03652 nsp_acc=98.747 throughput=115.0K tks/s lr=0.0000531 time=120.63 INFO:root:[step 469499] mlm_loss=1.63662 mlm_acc=65.66371 nsp_loss=0.03291 nsp_acc=98.820 throughput=139.0K tks/s lr=0.0000531 time=121.96 INFO:root:[step 469749] mlm_loss=1.45611 mlm_acc=67.51268 nsp_loss=0.03620 nsp_acc=98.698 throughput=116.0K tks/s lr=0.0000530 time=118.69 INFO:root:[step 469999] mlm_loss=1.53803 mlm_acc=66.75330 nsp_loss=0.02974 nsp_acc=98.975 throughput=129.0K tks/s lr=0.0000530 time=116.12 INFO:root:[step 469999] Saving checkpoints to /home/ubuntu/ckpt-master/0469999.params, /home/ubuntu/ckpt-master/0469999.states. INFO:root:[step 470249] mlm_loss=1.74673 mlm_acc=62.50500 nsp_loss=0.06859 nsp_acc=97.327 throughput=140.0K tks/s lr=0.0000530 time=183.82 INFO:root:[step 470499] mlm_loss=1.76248 mlm_acc=62.68397 nsp_loss=0.10016 nsp_acc=95.823 throughput=143.0K tks/s lr=0.0000530 time=147.38 INFO:root:[step 470749] mlm_loss=1.48179 mlm_acc=66.89540 nsp_loss=0.03208 nsp_acc=98.860 throughput=129.0K tks/s lr=0.0000529 time=112.02 INFO:root:[step 470999] mlm_loss=1.57287 mlm_acc=66.11358 nsp_loss=0.04044 nsp_acc=98.514 throughput=122.0K tks/s lr=0.0000529 time=118.15 INFO:root:[step 471249] mlm_loss=1.48184 mlm_acc=65.74226 nsp_loss=0.04980 nsp_acc=98.046 throughput=128.0K tks/s lr=0.0000529 time=120.50 INFO:root:[step 471499] mlm_loss=1.53804 mlm_acc=66.27775 nsp_loss=0.04300 nsp_acc=98.505 throughput=117.0K tks/s lr=0.0000529 time=119.11 INFO:root:[step 471749] mlm_loss=1.80182 mlm_acc=63.13175 nsp_loss=0.05530 nsp_acc=97.862 throughput=151.0K tks/s lr=0.0000528 time=149.01 INFO:root:[step 471999] mlm_loss=1.57474 mlm_acc=65.96711 nsp_loss=0.03267 nsp_acc=98.844 throughput=134.0K tks/s lr=0.0000528 time=119.29 INFO:root:[step 472249] mlm_loss=1.67274 mlm_acc=65.32539 nsp_loss=0.02793 nsp_acc=99.004 throughput=137.0K tks/s lr=0.0000528 time=134.97 INFO:root:[step 472499] mlm_loss=1.72403 mlm_acc=64.74304 nsp_loss=0.02441 nsp_acc=99.122 throughput=145.0K tks/s lr=0.0000528 time=144.77 INFO:root:[step 472749] mlm_loss=1.59772 mlm_acc=65.02690 nsp_loss=0.05265 nsp_acc=97.967 throughput=126.0K tks/s lr=0.0000527 time=125.94 INFO:root:[step 472999] mlm_loss=1.66627 mlm_acc=64.57624 nsp_loss=0.04189 nsp_acc=98.395 throughput=130.0K tks/s lr=0.0000527 time=132.40 INFO:root:[step 473249] mlm_loss=1.73411 mlm_acc=64.14385 nsp_loss=0.03334 nsp_acc=98.750 throughput=149.0K tks/s lr=0.0000527 time=145.50 INFO:root:[step 473499] mlm_loss=1.79085 mlm_acc=62.38304 nsp_loss=0.11276 nsp_acc=95.243 throughput=155.0K tks/s lr=0.0000527 time=157.99 INFO:root:[step 473749] mlm_loss=1.71659 mlm_acc=64.22488 nsp_loss=0.04660 nsp_acc=98.240 throughput=143.0K tks/s lr=0.0000526 time=141.20 INFO:root:[step 473999] mlm_loss=1.60481 mlm_acc=65.88580 nsp_loss=0.03639 nsp_acc=98.648 throughput=125.0K tks/s lr=0.0000526 time=124.56 INFO:root:[step 474249] mlm_loss=1.63417 mlm_acc=65.76623 nsp_loss=0.03335 nsp_acc=98.821 throughput=136.0K tks/s lr=0.0000526 time=118.65 INFO:root:[step 474499] mlm_loss=1.59234 mlm_acc=65.67866 nsp_loss=0.03445 nsp_acc=98.760 throughput=129.0K tks/s lr=0.0000526 time=129.28 INFO:root:[step 474749] mlm_loss=1.43852 mlm_acc=67.49453 nsp_loss=0.04071 nsp_acc=98.560 throughput=122.0K tks/s lr=0.0000525 time=108.96 INFO:root:[step 474999] mlm_loss=1.59436 mlm_acc=64.86091 nsp_loss=0.10942 nsp_acc=95.334 throughput=129.0K tks/s lr=0.0000525 time=131.54 INFO:root:[step 474999] Saving checkpoints to /home/ubuntu/ckpt-master/0474999.params, /home/ubuntu/ckpt-master/0474999.states. INFO:root:[step 475249] mlm_loss=1.54978 mlm_acc=66.54374 nsp_loss=0.03517 nsp_acc=98.738 throughput=110.0K tks/s lr=0.0000525 time=136.50 INFO:root:[step 475499] mlm_loss=1.47431 mlm_acc=67.11329 nsp_loss=0.03485 nsp_acc=98.779 throughput=125.0K tks/s lr=0.0000525 time=110.60 INFO:root:[step 475749] mlm_loss=1.69345 mlm_acc=63.14619 nsp_loss=0.05759 nsp_acc=97.759 throughput=133.0K tks/s lr=0.0000524 time=131.93 INFO:root:[step 475999] mlm_loss=1.59180 mlm_acc=65.28763 nsp_loss=0.03701 nsp_acc=98.690 throughput=139.0K tks/s lr=0.0000524 time=119.99 INFO:root:[step 476249] mlm_loss=1.66720 mlm_acc=64.84388 nsp_loss=0.03441 nsp_acc=98.759 throughput=138.0K tks/s lr=0.0000524 time=133.95 INFO:root:[step 476499] mlm_loss=1.62052 mlm_acc=65.76660 nsp_loss=0.03449 nsp_acc=98.724 throughput=124.0K tks/s lr=0.0000524 time=125.38 INFO:root:[step 476749] mlm_loss=1.69532 mlm_acc=63.38494 nsp_loss=0.07154 nsp_acc=97.274 throughput=153.0K tks/s lr=0.0000523 time=147.89 INFO:root:[step 476999] mlm_loss=1.45952 mlm_acc=65.50266 nsp_loss=0.04598 nsp_acc=98.377 throughput=131.0K tks/s lr=0.0000523 time=119.33 INFO:root:[step 477249] mlm_loss=1.60130 mlm_acc=64.31029 nsp_loss=0.03920 nsp_acc=98.592 throughput=134.0K tks/s lr=0.0000523 time=131.96 INFO:root:[step 477499] mlm_loss=1.75103 mlm_acc=62.68786 nsp_loss=0.05649 nsp_acc=97.782 throughput=141.0K tks/s lr=0.0000523 time=141.74 INFO:root:[step 477749] mlm_loss=1.46430 mlm_acc=67.03937 nsp_loss=0.03952 nsp_acc=98.631 throughput=117.0K tks/s lr=0.0000522 time=108.41 INFO:root:[step 477999] mlm_loss=1.61841 mlm_acc=66.40197 nsp_loss=0.03173 nsp_acc=98.902 throughput=141.0K tks/s lr=0.0000522 time=138.98 INFO:root:[step 478249] mlm_loss=1.59802 mlm_acc=64.64932 nsp_loss=0.06090 nsp_acc=97.616 throughput=136.0K tks/s lr=0.0000522 time=138.60 INFO:root:[step 478499] mlm_loss=1.41736 mlm_acc=67.73979 nsp_loss=0.03954 nsp_acc=98.633 throughput=119.0K tks/s lr=0.0000522 time=106.09 INFO:root:[step 478749] mlm_loss=1.53863 mlm_acc=66.48544 nsp_loss=0.04031 nsp_acc=98.535 throughput=119.0K tks/s lr=0.0000521 time=121.74 INFO:root:[step 478999] mlm_loss=1.40338 mlm_acc=67.57171 nsp_loss=0.04106 nsp_acc=98.518 throughput=115.0K tks/s lr=0.0000521 time=108.29 INFO:root:[step 479249] mlm_loss=1.64521 mlm_acc=63.80509 nsp_loss=0.04491 nsp_acc=98.299 throughput=137.0K tks/s lr=0.0000521 time=139.40 INFO:root:[step 479499] mlm_loss=1.46770 mlm_acc=67.25534 nsp_loss=0.03642 nsp_acc=98.691 throughput=129.0K tks/s lr=0.0000521 time=114.71 INFO:root:[step 479749] mlm_loss=1.55609 mlm_acc=65.35008 nsp_loss=0.06037 nsp_acc=97.711 throughput=129.0K tks/s lr=0.0000520 time=129.85 INFO:root:[step 479999] mlm_loss=1.61241 mlm_acc=64.80417 nsp_loss=0.05043 nsp_acc=98.096 throughput=138.0K tks/s lr=0.0000520 time=140.75 INFO:root:[step 479999] Saving checkpoints to /home/ubuntu/ckpt-master/0479999.params, /home/ubuntu/ckpt-master/0479999.states. INFO:root:[step 480249] mlm_loss=1.73352 mlm_acc=62.15784 nsp_loss=0.07073 nsp_acc=97.193 throughput=129.0K tks/s lr=0.0000520 time=154.78 INFO:root:[step 480499] mlm_loss=1.80423 mlm_acc=62.44149 nsp_loss=0.10039 nsp_acc=95.796 throughput=145.0K tks/s lr=0.0000520 time=146.41 INFO:root:[step 480749] mlm_loss=1.74387 mlm_acc=63.36750 nsp_loss=0.07809 nsp_acc=96.805 throughput=157.0K tks/s lr=0.0000519 time=160.12 INFO:root:[step 480999] mlm_loss=1.60547 mlm_acc=65.82278 nsp_loss=0.03728 nsp_acc=98.676 throughput=124.0K tks/s lr=0.0000519 time=127.19 INFO:root:[step 481249] mlm_loss=1.70250 mlm_acc=63.34453 nsp_loss=0.08400 nsp_acc=96.591 throughput=158.0K tks/s lr=0.0000519 time=159.08 INFO:root:[step 481499] mlm_loss=1.82539 mlm_acc=62.90407 nsp_loss=0.05528 nsp_acc=97.875 throughput=140.0K tks/s lr=0.0000519 time=139.05 INFO:root:[step 481749] mlm_loss=1.57087 mlm_acc=65.33162 nsp_loss=0.04611 nsp_acc=98.337 throughput=126.0K tks/s lr=0.0000518 time=129.48 INFO:root:[step 481999] mlm_loss=1.49364 mlm_acc=66.54777 nsp_loss=0.04203 nsp_acc=98.492 throughput=123.0K tks/s lr=0.0000518 time=125.65 INFO:root:[step 482249] mlm_loss=1.52602 mlm_acc=66.68048 nsp_loss=0.03638 nsp_acc=98.706 throughput=129.0K tks/s lr=0.0000518 time=111.52 INFO:root:[step 482499] mlm_loss=1.58931 mlm_acc=65.81248 nsp_loss=0.03974 nsp_acc=98.542 throughput=126.0K tks/s lr=0.0000518 time=126.20 INFO:root:[step 482749] mlm_loss=1.72857 mlm_acc=63.37178 nsp_loss=0.08462 nsp_acc=96.571 throughput=160.0K tks/s lr=0.0000517 time=161.75 INFO:root:[step 482999] mlm_loss=1.75860 mlm_acc=63.96621 nsp_loss=0.06510 nsp_acc=97.361 throughput=152.0K tks/s lr=0.0000517 time=155.46 INFO:root:[step 483249] mlm_loss=1.60183 mlm_acc=66.00575 nsp_loss=0.03856 nsp_acc=98.550 throughput=128.0K tks/s lr=0.0000517 time=127.00 INFO:root:[step 483499] mlm_loss=1.63232 mlm_acc=65.76148 nsp_loss=0.03161 nsp_acc=98.852 throughput=135.0K tks/s lr=0.0000517 time=128.31 INFO:root:[step 483749] mlm_loss=1.46462 mlm_acc=66.67904 nsp_loss=0.03741 nsp_acc=98.678 throughput=127.0K tks/s lr=0.0000516 time=117.64 INFO:root:[step 483999] mlm_loss=1.46905 mlm_acc=67.18394 nsp_loss=0.03749 nsp_acc=98.665 throughput=112.0K tks/s lr=0.0000516 time=118.30 INFO:root:[step 484249] mlm_loss=1.68638 mlm_acc=64.29900 nsp_loss=0.03584 nsp_acc=98.699 throughput=144.0K tks/s lr=0.0000516 time=137.80 INFO:root:[step 484499] mlm_loss=1.80191 mlm_acc=62.23580 nsp_loss=0.09215 nsp_acc=96.235 throughput=154.0K tks/s lr=0.0000516 time=158.78 INFO:root:[step 484749] mlm_loss=1.29796 mlm_acc=72.56658 nsp_loss=0.06265 nsp_acc=97.767 throughput=137.0K tks/s lr=0.0000515 time=141.27 INFO:root:[step 484999] mlm_loss=1.68461 mlm_acc=63.47897 nsp_loss=0.05070 nsp_acc=98.040 throughput=140.0K tks/s lr=0.0000515 time=137.57 INFO:root:[step 484999] Saving checkpoints to /home/ubuntu/ckpt-master/0484999.params, /home/ubuntu/ckpt-master/0484999.states. INFO:root:[step 485249] mlm_loss=1.66128 mlm_acc=65.26743 nsp_loss=0.03397 nsp_acc=98.799 throughput=122.0K tks/s lr=0.0000515 time=143.36 INFO:root:[step 485499] mlm_loss=1.66041 mlm_acc=65.04353 nsp_loss=0.03359 nsp_acc=98.804 throughput=141.0K tks/s lr=0.0000515 time=129.80 INFO:root:[step 485749] mlm_loss=1.53510 mlm_acc=66.03196 nsp_loss=0.06827 nsp_acc=97.412 throughput=122.0K tks/s lr=0.0000514 time=124.38 INFO:root:[step 485999] mlm_loss=1.44232 mlm_acc=66.56787 nsp_loss=0.06055 nsp_acc=97.666 throughput=128.0K tks/s lr=0.0000514 time=123.10 INFO:root:[step 486249] mlm_loss=1.57452 mlm_acc=64.86673 nsp_loss=0.05862 nsp_acc=97.800 throughput=137.0K tks/s lr=0.0000514 time=140.80 INFO:root:[step 486499] mlm_loss=1.59828 mlm_acc=65.62934 nsp_loss=0.03567 nsp_acc=98.703 throughput=128.0K tks/s lr=0.0000514 time=128.85 INFO:root:[step 486749] mlm_loss=1.55792 mlm_acc=66.63847 nsp_loss=0.03425 nsp_acc=98.789 throughput=134.0K tks/s lr=0.0000513 time=116.35 INFO:root:[step 486999] mlm_loss=1.71160 mlm_acc=63.33446 nsp_loss=0.12068 nsp_acc=94.923 throughput=143.0K tks/s lr=0.0000513 time=161.97 INFO:root:[step 487249] mlm_loss=1.39828 mlm_acc=67.33814 nsp_loss=0.04697 nsp_acc=98.285 throughput=115.0K tks/s lr=0.0000513 time=108.95 INFO:root:[step 487499] mlm_loss=1.50573 mlm_acc=65.95032 nsp_loss=0.03746 nsp_acc=98.668 throughput=129.0K tks/s lr=0.0000513 time=127.37 INFO:root:[step 487749] mlm_loss=1.48979 mlm_acc=67.11004 nsp_loss=0.04010 nsp_acc=98.596 throughput=123.0K tks/s lr=0.0000512 time=110.58 INFO:root:[step 487999] mlm_loss=1.61070 mlm_acc=66.16401 nsp_loss=0.03635 nsp_acc=98.655 throughput=134.0K tks/s lr=0.0000512 time=117.12 INFO:root:[step 488249] mlm_loss=1.61203 mlm_acc=65.89149 nsp_loss=0.03416 nsp_acc=98.796 throughput=131.0K tks/s lr=0.0000512 time=131.34 INFO:root:[step 488499] mlm_loss=1.59496 mlm_acc=64.85048 nsp_loss=0.07010 nsp_acc=97.213 throughput=137.0K tks/s lr=0.0000512 time=137.50 INFO:root:[step 488749] mlm_loss=1.55129 mlm_acc=66.69580 nsp_loss=0.03697 nsp_acc=98.646 throughput=132.0K tks/s lr=0.0000511 time=111.41 INFO:root:[step 488999] mlm_loss=1.65189 mlm_acc=65.37664 nsp_loss=0.03179 nsp_acc=98.895 throughput=130.0K tks/s lr=0.0000511 time=133.58 INFO:root:[step 489249] mlm_loss=1.41657 mlm_acc=67.09119 nsp_loss=0.05438 nsp_acc=97.947 throughput=107.0K tks/s lr=0.0000511 time=115.92 INFO:root:[step 489499] mlm_loss=1.58668 mlm_acc=64.82007 nsp_loss=0.05000 nsp_acc=98.094 throughput=145.0K tks/s lr=0.0000511 time=127.83 INFO:root:[step 489749] mlm_loss=1.55734 mlm_acc=65.33854 nsp_loss=0.07926 nsp_acc=96.810 throughput=137.0K tks/s lr=0.0000510 time=139.89 INFO:root:[step 489999] mlm_loss=1.49291 mlm_acc=67.12650 nsp_loss=0.03473 nsp_acc=98.792 throughput=118.0K tks/s lr=0.0000510 time=115.95 INFO:root:[step 489999] Saving checkpoints to /home/ubuntu/ckpt-master/0489999.params, /home/ubuntu/ckpt-master/0489999.states. INFO:root:[step 490249] mlm_loss=1.68978 mlm_acc=64.62709 nsp_loss=0.08476 nsp_acc=96.575 throughput=140.0K tks/s lr=0.0000510 time=171.66 INFO:root:[step 490499] mlm_loss=1.51197 mlm_acc=67.15744 nsp_loss=0.04274 nsp_acc=98.504 throughput=133.0K tks/s lr=0.0000510 time=129.11 INFO:root:[step 490749] mlm_loss=1.82788 mlm_acc=61.81256 nsp_loss=0.08190 nsp_acc=96.612 throughput=164.0K tks/s lr=0.0000509 time=173.28 INFO:root:[step 490999] mlm_loss=1.46899 mlm_acc=66.81164 nsp_loss=0.04971 nsp_acc=98.237 throughput=115.0K tks/s lr=0.0000509 time=123.95 INFO:root:[step 491249] mlm_loss=1.37721 mlm_acc=68.50611 nsp_loss=0.05511 nsp_acc=98.040 throughput=118.0K tks/s lr=0.0000509 time=107.09 INFO:root:[step 491499] mlm_loss=1.45931 mlm_acc=67.24614 nsp_loss=0.03924 nsp_acc=98.628 throughput=124.0K tks/s lr=0.0000509 time=111.07 INFO:root:[step 491749] mlm_loss=1.79578 mlm_acc=62.52255 nsp_loss=0.05176 nsp_acc=97.998 throughput=148.0K tks/s lr=0.0000508 time=160.56 INFO:root:[step 491999] mlm_loss=1.72003 mlm_acc=64.28565 nsp_loss=0.04335 nsp_acc=98.340 throughput=143.0K tks/s lr=0.0000508 time=147.04 INFO:root:[step 492249] mlm_loss=1.69997 mlm_acc=65.35688 nsp_loss=0.03094 nsp_acc=98.888 throughput=139.0K tks/s lr=0.0000508 time=138.10 INFO:root:[step 492499] mlm_loss=1.71196 mlm_acc=65.15389 nsp_loss=0.03000 nsp_acc=98.927 throughput=140.0K tks/s lr=0.0000508 time=137.21 INFO:root:[step 492749] mlm_loss=1.73574 mlm_acc=64.80171 nsp_loss=0.03260 nsp_acc=98.840 throughput=143.0K tks/s lr=0.0000507 time=138.88 INFO:root:[step 492999] mlm_loss=1.55207 mlm_acc=66.09218 nsp_loss=0.03842 nsp_acc=98.587 throughput=129.0K tks/s lr=0.0000507 time=118.79 INFO:root:[step 493249] mlm_loss=1.65474 mlm_acc=64.07189 nsp_loss=0.03710 nsp_acc=98.622 throughput=149.0K tks/s lr=0.0000507 time=146.97 INFO:root:[step 493499] mlm_loss=1.61277 mlm_acc=65.64522 nsp_loss=0.03271 nsp_acc=98.817 throughput=134.0K tks/s lr=0.0000507 time=134.31 INFO:root:[step 493749] mlm_loss=1.60560 mlm_acc=66.01169 nsp_loss=0.03366 nsp_acc=98.829 throughput=128.0K tks/s lr=0.0000506 time=130.28 INFO:root:[step 493999] mlm_loss=1.78481 mlm_acc=62.59349 nsp_loss=0.06259 nsp_acc=97.540 throughput=127.0K tks/s lr=0.0000506 time=117.41 INFO:root:[step 494249] mlm_loss=1.52940 mlm_acc=65.80023 nsp_loss=0.05357 nsp_acc=98.044 throughput=113.0K tks/s lr=0.0000506 time=118.97 INFO:root:[step 494499] mlm_loss=1.32730 mlm_acc=69.19007 nsp_loss=0.04743 nsp_acc=98.428 throughput=118.0K tks/s lr=0.0000506 time=108.74 INFO:root:[step 494749] mlm_loss=1.45957 mlm_acc=67.53352 nsp_loss=0.03859 nsp_acc=98.662 throughput=125.0K tks/s lr=0.0000505 time=108.83 INFO:root:[step 494999] mlm_loss=1.49955 mlm_acc=66.93844 nsp_loss=0.03908 nsp_acc=98.569 throughput=113.0K tks/s lr=0.0000505 time=118.55 INFO:root:[step 494999] Saving checkpoints to /home/ubuntu/ckpt-master/0494999.params, /home/ubuntu/ckpt-master/0494999.states. INFO:root:[step 495249] mlm_loss=1.41807 mlm_acc=67.41444 nsp_loss=0.04305 nsp_acc=98.433 throughput=101.0K tks/s lr=0.0000505 time=121.95 INFO:root:[step 495499] mlm_loss=1.54226 mlm_acc=66.34110 nsp_loss=0.03803 nsp_acc=98.628 throughput=127.0K tks/s lr=0.0000505 time=111.45 INFO:root:[step 495749] mlm_loss=1.45077 mlm_acc=66.79260 nsp_loss=0.04144 nsp_acc=98.537 throughput=116.0K tks/s lr=0.0000504 time=120.73 INFO:root:[step 495999] mlm_loss=1.75121 mlm_acc=62.88780 nsp_loss=0.04298 nsp_acc=98.414 throughput=142.0K tks/s lr=0.0000504 time=138.79 INFO:root:[step 496249] mlm_loss=1.77376 mlm_acc=63.12526 nsp_loss=0.05907 nsp_acc=97.743 throughput=146.0K tks/s lr=0.0000504 time=144.57 INFO:root:[step 496499] mlm_loss=1.66858 mlm_acc=64.00869 nsp_loss=0.04794 nsp_acc=98.150 throughput=141.0K tks/s lr=0.0000504 time=142.77 INFO:root:[step 496749] mlm_loss=1.40117 mlm_acc=67.80936 nsp_loss=0.04356 nsp_acc=98.466 throughput=114.0K tks/s lr=0.0000503 time=107.56 INFO:root:[step 496999] mlm_loss=1.64223 mlm_acc=64.59774 nsp_loss=0.10547 nsp_acc=95.483 throughput=134.0K tks/s lr=0.0000503 time=118.20 INFO:root:[step 497249] mlm_loss=1.60931 mlm_acc=65.63295 nsp_loss=0.04244 nsp_acc=98.437 throughput=129.0K tks/s lr=0.0000503 time=128.70 INFO:root:[step 497499] mlm_loss=1.72059 mlm_acc=62.81453 nsp_loss=0.05375 nsp_acc=97.920 throughput=153.0K tks/s lr=0.0000503 time=152.58 INFO:root:[step 497749] mlm_loss=1.84749 mlm_acc=61.87206 nsp_loss=0.07991 nsp_acc=96.872 throughput=147.0K tks/s lr=0.0000502 time=167.80 INFO:root:[step 497999] mlm_loss=1.49726 mlm_acc=66.88200 nsp_loss=0.03758 nsp_acc=98.649 throughput=127.0K tks/s lr=0.0000502 time=110.42 INFO:root:[step 498249] mlm_loss=1.62788 mlm_acc=64.77694 nsp_loss=0.09068 nsp_acc=96.129 throughput=136.0K tks/s lr=0.0000502 time=138.13 INFO:root:[step 498499] mlm_loss=1.53571 mlm_acc=66.68494 nsp_loss=0.03751 nsp_acc=98.650 throughput=129.0K tks/s lr=0.0000502 time=111.45 INFO:root:[step 498749] mlm_loss=1.50942 mlm_acc=66.63084 nsp_loss=0.03649 nsp_acc=98.678 throughput=120.0K tks/s lr=0.0000501 time=117.87 INFO:root:[step 498999] mlm_loss=1.69420 mlm_acc=63.60020 nsp_loss=0.03746 nsp_acc=98.631 throughput=140.0K tks/s lr=0.0000501 time=145.89 INFO:root:[step 499249] mlm_loss=1.45739 mlm_acc=67.39015 nsp_loss=0.03993 nsp_acc=98.579 throughput=118.0K tks/s lr=0.0000501 time=108.91 INFO:root:[step 499499] mlm_loss=1.42976 mlm_acc=67.75651 nsp_loss=0.04101 nsp_acc=98.508 throughput=118.0K tks/s lr=0.0000501 time=107.01 INFO:root:[step 499749] mlm_loss=1.44823 mlm_acc=67.47220 nsp_loss=0.03952 nsp_acc=98.672 throughput=115.0K tks/s lr=0.0000500 time=117.02 INFO:root:[step 499999] mlm_loss=1.67957 mlm_acc=65.14870 nsp_loss=0.02897 nsp_acc=98.948 throughput=141.0K tks/s lr=0.0000500 time=139.20 INFO:root:[step 499999] Saving checkpoints to /home/ubuntu/ckpt-master/0499999.params, /home/ubuntu/ckpt-master/0499999.states. INFO:root:[step 500249] mlm_loss=1.57170 mlm_acc=66.29845 nsp_loss=0.03675 nsp_acc=98.685 throughput=113.0K tks/s lr=0.0000500 time=132.49 INFO:root:[step 500499] mlm_loss=1.60573 mlm_acc=65.14471 nsp_loss=0.03626 nsp_acc=98.710 throughput=134.0K tks/s lr=0.0000500 time=124.92 INFO:root:[step 500749] mlm_loss=1.90936 mlm_acc=61.34093 nsp_loss=0.04985 nsp_acc=98.106 throughput=157.0K tks/s lr=0.0000499 time=160.83 INFO:root:[step 500999] mlm_loss=1.75321 mlm_acc=64.12317 nsp_loss=0.03163 nsp_acc=98.823 throughput=146.0K tks/s lr=0.0000499 time=145.46 INFO:root:[step 501249] mlm_loss=1.79787 mlm_acc=62.42782 nsp_loss=0.11262 nsp_acc=95.190 throughput=145.0K tks/s lr=0.0000499 time=160.16 INFO:root:[step 501499] mlm_loss=1.58727 mlm_acc=66.19843 nsp_loss=0.03336 nsp_acc=98.843 throughput=135.0K tks/s lr=0.0000499 time=120.10 INFO:root:[step 501749] mlm_loss=1.41336 mlm_acc=67.73582 nsp_loss=0.04024 nsp_acc=98.574 throughput=108.0K tks/s lr=0.0000498 time=113.06 INFO:root:[step 501999] mlm_loss=1.81374 mlm_acc=62.71831 nsp_loss=0.05843 nsp_acc=97.759 throughput=155.0K tks/s lr=0.0000498 time=154.08 INFO:root:[step 502249] mlm_loss=1.52127 mlm_acc=64.67860 nsp_loss=0.04847 nsp_acc=98.340 throughput=133.0K tks/s lr=0.0000498 time=122.40 INFO:root:[step 502499] mlm_loss=1.67080 mlm_acc=64.41507 nsp_loss=0.06350 nsp_acc=97.525 throughput=145.0K tks/s lr=0.0000498 time=156.49 INFO:root:[step 502749] mlm_loss=1.69675 mlm_acc=64.05072 nsp_loss=0.03786 nsp_acc=98.587 throughput=147.0K tks/s lr=0.0000497 time=147.78 INFO:root:[step 502999] mlm_loss=1.77253 mlm_acc=64.22492 nsp_loss=0.04695 nsp_acc=98.210 throughput=139.0K tks/s lr=0.0000497 time=138.72 INFO:root:[step 503249] mlm_loss=1.84991 mlm_acc=62.77070 nsp_loss=0.05030 nsp_acc=98.115 throughput=145.0K tks/s lr=0.0000497 time=140.83 INFO:root:[step 503499] mlm_loss=1.57511 mlm_acc=66.13477 nsp_loss=0.03745 nsp_acc=98.717 throughput=132.0K tks/s lr=0.0000497 time=118.83 INFO:root:[step 503749] mlm_loss=1.57727 mlm_acc=65.97953 nsp_loss=0.03767 nsp_acc=98.645 throughput=128.0K tks/s lr=0.0000496 time=127.84 INFO:root:[step 503999] mlm_loss=1.41281 mlm_acc=67.72951 nsp_loss=0.03877 nsp_acc=98.646 throughput=119.0K tks/s lr=0.0000496 time=109.08 INFO:root:[step 504249] mlm_loss=1.61816 mlm_acc=65.81615 nsp_loss=0.03720 nsp_acc=98.686 throughput=129.0K tks/s lr=0.0000496 time=126.01 INFO:root:[step 504499] mlm_loss=1.59847 mlm_acc=66.15280 nsp_loss=0.03291 nsp_acc=98.805 throughput=133.0K tks/s lr=0.0000496 time=131.66 INFO:root:[step 504749] mlm_loss=1.57934 mlm_acc=64.97611 nsp_loss=0.09274 nsp_acc=96.050 throughput=138.0K tks/s lr=0.0000495 time=123.57 INFO:root:[step 504999] mlm_loss=1.72109 mlm_acc=63.67531 nsp_loss=0.04738 nsp_acc=98.195 throughput=144.0K tks/s lr=0.0000495 time=155.71 INFO:root:[step 504999] Saving checkpoints to /home/ubuntu/ckpt-master/0504999.params, /home/ubuntu/ckpt-master/0504999.states. INFO:root:[step 505249] mlm_loss=1.64039 mlm_acc=66.31776 nsp_loss=0.03500 nsp_acc=98.766 throughput=132.0K tks/s lr=0.0000495 time=144.20 INFO:root:[step 505499] mlm_loss=1.88359 mlm_acc=61.42421 nsp_loss=0.10728 nsp_acc=95.598 throughput=150.0K tks/s lr=0.0000495 time=160.80 INFO:root:[step 505749] mlm_loss=1.76186 mlm_acc=63.10069 nsp_loss=0.05467 nsp_acc=97.899 throughput=149.0K tks/s lr=0.0000494 time=151.35 INFO:root:[step 505999] mlm_loss=1.56807 mlm_acc=65.19305 nsp_loss=0.05602 nsp_acc=97.839 throughput=136.0K tks/s lr=0.0000494 time=131.82 INFO:root:[step 506249] mlm_loss=1.60434 mlm_acc=64.72194 nsp_loss=0.04940 nsp_acc=98.153 throughput=144.0K tks/s lr=0.0000494 time=133.32 INFO:root:[step 506499] mlm_loss=1.44839 mlm_acc=67.67625 nsp_loss=0.04137 nsp_acc=98.500 throughput=109.0K tks/s lr=0.0000494 time=116.96 INFO:root:[step 506749] mlm_loss=1.47114 mlm_acc=67.44502 nsp_loss=0.03990 nsp_acc=98.605 throughput=122.0K tks/s lr=0.0000493 time=109.27 INFO:root:[step 506999] mlm_loss=1.45437 mlm_acc=67.21579 nsp_loss=0.05008 nsp_acc=98.141 throughput=117.0K tks/s lr=0.0000493 time=107.21 INFO:root:[step 507249] mlm_loss=1.64034 mlm_acc=65.66718 nsp_loss=0.03348 nsp_acc=98.782 throughput=131.0K tks/s lr=0.0000493 time=133.15 INFO:root:[step 507499] mlm_loss=1.59489 mlm_acc=65.95232 nsp_loss=0.03422 nsp_acc=98.769 throughput=129.0K tks/s lr=0.0000493 time=131.31 INFO:root:[step 507749] mlm_loss=1.40570 mlm_acc=68.33244 nsp_loss=0.04075 nsp_acc=98.577 throughput=114.0K tks/s lr=0.0000492 time=105.22 INFO:root:[step 508249] mlm_loss=3.22481 mlm_acc=64.86018 nsp_loss=0.08369 nsp_acc=98.466 throughput=136.0K tks/s lr=0.0000492 time=253.99 INFO:root:[step 508499] mlm_loss=1.67110 mlm_acc=64.03368 nsp_loss=0.07295 nsp_acc=97.124 throughput=137.0K tks/s lr=0.0000492 time=137.74 INFO:root:[step 508749] mlm_loss=1.51439 mlm_acc=66.57392 nsp_loss=0.03683 nsp_acc=98.706 throughput=118.0K tks/s lr=0.0000491 time=119.29 INFO:root:[step 509249] mlm_loss=3.31287 mlm_acc=64.69704 nsp_loss=0.07522 nsp_acc=98.643 throughput=142.0K tks/s lr=0.0000491 time=265.21 INFO:root:[step 509499] mlm_loss=1.56353 mlm_acc=66.47291 nsp_loss=0.03528 nsp_acc=98.740 throughput=125.0K tks/s lr=0.0000491 time=123.80 INFO:root:[step 509749] mlm_loss=1.83189 mlm_acc=62.32732 nsp_loss=0.04049 nsp_acc=98.471 throughput=151.0K tks/s lr=0.0000490 time=149.40 INFO:root:[step 509999] mlm_loss=1.65256 mlm_acc=64.14163 nsp_loss=0.05251 nsp_acc=98.005 throughput=143.0K tks/s lr=0.0000490 time=145.19 INFO:root:[step 509999] Saving checkpoints to /home/ubuntu/ckpt-master/0509999.params, /home/ubuntu/ckpt-master/0509999.states. INFO:root:[step 510249] mlm_loss=1.38042 mlm_acc=68.05914 nsp_loss=0.04595 nsp_acc=98.394 throughput=103.0K tks/s lr=0.0000490 time=132.08 INFO:root:[step 510499] mlm_loss=1.61308 mlm_acc=65.78958 nsp_loss=0.03550 nsp_acc=98.723 throughput=135.0K tks/s lr=0.0000490 time=122.72 INFO:root:[step 510749] mlm_loss=1.59298 mlm_acc=66.08617 nsp_loss=0.03575 nsp_acc=98.741 throughput=125.0K tks/s lr=0.0000489 time=127.28 INFO:root:[step 510999] mlm_loss=1.48378 mlm_acc=66.83926 nsp_loss=0.04220 nsp_acc=98.442 throughput=121.0K tks/s lr=0.0000489 time=112.91 INFO:root:[step 511249] mlm_loss=1.72487 mlm_acc=63.95832 nsp_loss=0.05267 nsp_acc=97.992 throughput=148.0K tks/s lr=0.0000489 time=142.82 INFO:root:[step 511499] mlm_loss=1.50796 mlm_acc=66.23835 nsp_loss=0.04355 nsp_acc=98.410 throughput=124.0K tks/s lr=0.0000489 time=124.80 INFO:root:[step 511749] mlm_loss=1.71762 mlm_acc=64.27380 nsp_loss=0.04386 nsp_acc=98.345 throughput=137.0K tks/s lr=0.0000488 time=134.21 INFO:root:[step 511999] mlm_loss=1.68718 mlm_acc=64.40719 nsp_loss=0.05369 nsp_acc=97.909 throughput=133.0K tks/s lr=0.0000488 time=131.29 INFO:root:[step 512249] mlm_loss=1.72133 mlm_acc=64.02715 nsp_loss=0.05427 nsp_acc=97.934 throughput=146.0K tks/s lr=0.0000488 time=150.13 INFO:root:[step 512499] mlm_loss=1.56997 mlm_acc=66.44667 nsp_loss=0.03653 nsp_acc=98.688 throughput=134.0K tks/s lr=0.0000488 time=114.91 INFO:root:[step 512749] mlm_loss=1.58555 mlm_acc=65.24166 nsp_loss=0.04867 nsp_acc=98.181 throughput=137.0K tks/s lr=0.0000487 time=135.11 INFO:root:[step 512999] mlm_loss=1.66346 mlm_acc=63.45027 nsp_loss=0.06544 nsp_acc=97.452 throughput=142.0K tks/s lr=0.0000487 time=142.73 INFO:root:[step 513249] mlm_loss=1.47278 mlm_acc=67.08591 nsp_loss=0.04068 nsp_acc=98.529 throughput=123.0K tks/s lr=0.0000487 time=110.62 INFO:root:[step 513499] mlm_loss=1.61375 mlm_acc=64.78265 nsp_loss=0.05515 nsp_acc=97.892 throughput=120.0K tks/s lr=0.0000487 time=122.97 INFO:root:[step 513749] mlm_loss=1.43574 mlm_acc=70.34510 nsp_loss=0.07918 nsp_acc=97.086 throughput=136.0K tks/s lr=0.0000486 time=140.82 INFO:root:[step 513999] mlm_loss=1.43935 mlm_acc=67.76660 nsp_loss=0.03939 nsp_acc=98.574 throughput=120.0K tks/s lr=0.0000486 time=106.85 INFO:root:[step 514249] mlm_loss=1.46979 mlm_acc=67.23241 nsp_loss=0.04043 nsp_acc=98.493 throughput=127.0K tks/s lr=0.0000486 time=110.57 INFO:root:[step 514499] mlm_loss=1.44853 mlm_acc=67.59550 nsp_loss=0.03986 nsp_acc=98.552 throughput=108.0K tks/s lr=0.0000486 time=115.06 INFO:root:[step 514749] mlm_loss=1.52639 mlm_acc=65.91383 nsp_loss=0.04226 nsp_acc=98.457 throughput=133.0K tks/s lr=0.0000485 time=115.13 INFO:root:[step 514999] mlm_loss=1.56973 mlm_acc=65.28969 nsp_loss=0.06029 nsp_acc=97.714 throughput=142.0K tks/s lr=0.0000485 time=143.71 INFO:root:[step 514999] Saving checkpoints to /home/ubuntu/ckpt-master/0514999.params, /home/ubuntu/ckpt-master/0514999.states. INFO:root:[step 515249] mlm_loss=1.38967 mlm_acc=67.76253 nsp_loss=0.04704 nsp_acc=98.278 throughput=101.0K tks/s lr=0.0000485 time=122.90 INFO:root:[step 515499] mlm_loss=1.61225 mlm_acc=66.05599 nsp_loss=0.03915 nsp_acc=98.607 throughput=126.0K tks/s lr=0.0000485 time=127.01 INFO:root:[step 515749] mlm_loss=1.76802 mlm_acc=62.81634 nsp_loss=0.04213 nsp_acc=98.416 throughput=149.0K tks/s lr=0.0000484 time=145.38 INFO:root:[step 515999] mlm_loss=1.66068 mlm_acc=65.08835 nsp_loss=0.03360 nsp_acc=98.744 throughput=137.0K tks/s lr=0.0000484 time=135.73 INFO:root:[step 516249] mlm_loss=1.60654 mlm_acc=64.73664 nsp_loss=0.07468 nsp_acc=96.957 throughput=134.0K tks/s lr=0.0000484 time=141.70 INFO:root:[step 516499] mlm_loss=1.58349 mlm_acc=65.20393 nsp_loss=0.07531 nsp_acc=96.978 throughput=139.0K tks/s lr=0.0000484 time=124.40 INFO:root:[step 516749] mlm_loss=1.52977 mlm_acc=66.67989 nsp_loss=0.03735 nsp_acc=98.668 throughput=118.0K tks/s lr=0.0000483 time=121.69 INFO:root:[step 516999] mlm_loss=1.42412 mlm_acc=67.74125 nsp_loss=0.03712 nsp_acc=98.708 throughput=123.0K tks/s lr=0.0000483 time=108.62 INFO:root:[step 517249] mlm_loss=1.51900 mlm_acc=65.39062 nsp_loss=0.05984 nsp_acc=97.803 throughput=137.0K tks/s lr=0.0000483 time=136.99 INFO:root:[step 517499] mlm_loss=1.40085 mlm_acc=68.08316 nsp_loss=0.04028 nsp_acc=98.591 throughput=119.0K tks/s lr=0.0000483 time=105.91 INFO:root:[step 517749] mlm_loss=1.67391 mlm_acc=65.04925 nsp_loss=0.02998 nsp_acc=98.936 throughput=142.0K tks/s lr=0.0000482 time=136.24 INFO:root:[step 517999] mlm_loss=1.46184 mlm_acc=69.16243 nsp_loss=0.04597 nsp_acc=98.386 throughput=128.0K tks/s lr=0.0000482 time=130.03 INFO:root:[step 518249] mlm_loss=1.17273 mlm_acc=73.11976 nsp_loss=0.05842 nsp_acc=97.936 throughput=123.0K tks/s lr=0.0000482 time=114.85 INFO:root:[step 518499] mlm_loss=1.53491 mlm_acc=65.96278 nsp_loss=0.04713 nsp_acc=98.291 throughput=126.0K tks/s lr=0.0000482 time=121.69 INFO:root:[step 518749] mlm_loss=1.54671 mlm_acc=65.01874 nsp_loss=0.05566 nsp_acc=97.913 throughput=138.0K tks/s lr=0.0000481 time=126.37 INFO:root:[step 518999] mlm_loss=1.59320 mlm_acc=64.61410 nsp_loss=0.05255 nsp_acc=98.006 throughput=140.0K tks/s lr=0.0000481 time=139.47 INFO:root:[step 519249] mlm_loss=1.67363 mlm_acc=64.45893 nsp_loss=0.05290 nsp_acc=97.952 throughput=143.0K tks/s lr=0.0000481 time=141.45 INFO:root:[step 519499] mlm_loss=1.74160 mlm_acc=64.34520 nsp_loss=0.03559 nsp_acc=98.626 throughput=146.0K tks/s lr=0.0000481 time=144.55 INFO:root:[step 519749] mlm_loss=1.77095 mlm_acc=63.15650 nsp_loss=0.03627 nsp_acc=98.665 throughput=146.0K tks/s lr=0.0000480 time=154.83 INFO:root:[step 519999] mlm_loss=1.45468 mlm_acc=66.59918 nsp_loss=0.04556 nsp_acc=98.386 throughput=130.0K tks/s lr=0.0000480 time=119.82 INFO:root:[step 519999] Saving checkpoints to /home/ubuntu/ckpt-master/0519999.params, /home/ubuntu/ckpt-master/0519999.states. INFO:root:[step 520249] mlm_loss=1.39382 mlm_acc=67.73733 nsp_loss=0.04337 nsp_acc=98.487 throughput=102.0K tks/s lr=0.0000480 time=129.30 INFO:root:[step 520499] mlm_loss=1.56530 mlm_acc=65.90493 nsp_loss=0.03458 nsp_acc=98.758 throughput=136.0K tks/s lr=0.0000480 time=123.30 INFO:root:[step 520749] mlm_loss=1.47211 mlm_acc=67.20722 nsp_loss=0.04140 nsp_acc=98.504 throughput=123.0K tks/s lr=0.0000479 time=120.84 INFO:root:[step 520999] mlm_loss=1.57683 mlm_acc=66.12400 nsp_loss=0.03857 nsp_acc=98.597 throughput=131.0K tks/s lr=0.0000479 time=120.32 INFO:root:[step 521249] mlm_loss=1.69747 mlm_acc=65.07927 nsp_loss=0.03501 nsp_acc=98.692 throughput=144.0K tks/s lr=0.0000479 time=139.94 INFO:root:[step 521499] mlm_loss=1.86181 mlm_acc=61.38811 nsp_loss=0.06308 nsp_acc=97.571 throughput=146.0K tks/s lr=0.0000479 time=168.73 INFO:root:[step 521749] mlm_loss=1.56917 mlm_acc=66.43422 nsp_loss=0.03436 nsp_acc=98.822 throughput=133.0K tks/s lr=0.0000478 time=115.90 INFO:root:[step 521999] mlm_loss=1.55147 mlm_acc=65.35523 nsp_loss=0.04347 nsp_acc=98.419 throughput=128.0K tks/s lr=0.0000478 time=122.92 INFO:root:[step 522249] mlm_loss=1.72753 mlm_acc=63.21167 nsp_loss=0.05072 nsp_acc=98.051 throughput=143.0K tks/s lr=0.0000478 time=143.81 INFO:root:[step 522499] mlm_loss=1.51425 mlm_acc=67.07548 nsp_loss=0.03665 nsp_acc=98.679 throughput=127.0K tks/s lr=0.0000478 time=112.47 INFO:root:[step 522749] mlm_loss=1.70261 mlm_acc=65.04089 nsp_loss=0.02963 nsp_acc=98.972 throughput=142.0K tks/s lr=0.0000477 time=138.91 INFO:root:[step 522999] mlm_loss=1.70393 mlm_acc=65.23762 nsp_loss=0.03229 nsp_acc=98.829 throughput=141.0K tks/s lr=0.0000477 time=137.66 INFO:root:[step 523249] mlm_loss=1.72659 mlm_acc=64.90435 nsp_loss=0.03170 nsp_acc=98.863 throughput=143.0K tks/s lr=0.0000477 time=155.06 INFO:root:[step 523499] mlm_loss=1.51820 mlm_acc=68.82543 nsp_loss=0.04297 nsp_acc=98.430 throughput=146.0K tks/s lr=0.0000477 time=131.22 INFO:root:[step 523749] mlm_loss=1.57364 mlm_acc=66.26123 nsp_loss=0.03975 nsp_acc=98.576 throughput=120.0K tks/s lr=0.0000476 time=123.52 INFO:root:[step 523999] mlm_loss=1.82500 mlm_acc=61.72380 nsp_loss=0.07311 nsp_acc=97.124 throughput=123.0K tks/s lr=0.0000476 time=128.12 INFO:root:[step 524249] mlm_loss=1.57740 mlm_acc=64.12399 nsp_loss=0.04180 nsp_acc=98.496 throughput=140.0K tks/s lr=0.0000476 time=118.75 INFO:root:[step 524499] mlm_loss=1.53909 mlm_acc=65.45077 nsp_loss=0.03942 nsp_acc=98.587 throughput=118.0K tks/s lr=0.0000476 time=127.79 INFO:root:[step 524749] mlm_loss=1.28412 mlm_acc=67.88252 nsp_loss=0.07751 nsp_acc=97.151 throughput=121.0K tks/s lr=0.0000475 time=107.67 INFO:root:[step 524999] mlm_loss=1.47086 mlm_acc=66.17524 nsp_loss=0.07164 nsp_acc=97.215 throughput=128.0K tks/s lr=0.0000475 time=119.82 INFO:root:[step 524999] Saving checkpoints to /home/ubuntu/ckpt-master/0524999.params, /home/ubuntu/ckpt-master/0524999.states. INFO:root:[step 525249] mlm_loss=1.53930 mlm_acc=65.45482 nsp_loss=0.04492 nsp_acc=98.318 throughput=110.0K tks/s lr=0.0000475 time=138.44 INFO:root:[step 525499] mlm_loss=1.78331 mlm_acc=63.52381 nsp_loss=0.03370 nsp_acc=98.722 throughput=153.0K tks/s lr=0.0000475 time=150.79 INFO:root:[step 525749] mlm_loss=1.68839 mlm_acc=65.31764 nsp_loss=0.03521 nsp_acc=98.742 throughput=136.0K tks/s lr=0.0000474 time=137.23 INFO:root:[step 525999] mlm_loss=1.62372 mlm_acc=65.09120 nsp_loss=0.04237 nsp_acc=98.447 throughput=138.0K tks/s lr=0.0000474 time=133.64 INFO:root:[step 526249] mlm_loss=1.72675 mlm_acc=64.01128 nsp_loss=0.04237 nsp_acc=98.448 throughput=141.0K tks/s lr=0.0000474 time=140.84 INFO:root:[step 526499] mlm_loss=1.59416 mlm_acc=66.21078 nsp_loss=0.03691 nsp_acc=98.641 throughput=133.0K tks/s lr=0.0000474 time=115.09 INFO:root:[step 526749] mlm_loss=1.47293 mlm_acc=67.26916 nsp_loss=0.04111 nsp_acc=98.559 throughput=113.0K tks/s lr=0.0000473 time=117.21 INFO:root:[step 526999] mlm_loss=1.66724 mlm_acc=65.74222 nsp_loss=0.03384 nsp_acc=98.753 throughput=135.0K tks/s lr=0.0000473 time=131.89 INFO:root:[step 527249] mlm_loss=1.64178 mlm_acc=66.06785 nsp_loss=0.03159 nsp_acc=98.904 throughput=142.0K tks/s lr=0.0000473 time=125.85 INFO:root:[step 527499] mlm_loss=1.61449 mlm_acc=66.04744 nsp_loss=0.03488 nsp_acc=98.713 throughput=128.0K tks/s lr=0.0000473 time=126.95 INFO:root:[step 527749] mlm_loss=1.66326 mlm_acc=63.86684 nsp_loss=0.06214 nsp_acc=97.617 throughput=142.0K tks/s lr=0.0000472 time=138.88 INFO:root:[step 527999] mlm_loss=1.71597 mlm_acc=64.15918 nsp_loss=0.05286 nsp_acc=97.914 throughput=141.0K tks/s lr=0.0000472 time=143.09 INFO:root:[step 528249] mlm_loss=1.55037 mlm_acc=66.75257 nsp_loss=0.04078 nsp_acc=98.520 throughput=127.0K tks/s lr=0.0000472 time=113.39 INFO:root:[step 528499] mlm_loss=1.59664 mlm_acc=65.87414 nsp_loss=0.03594 nsp_acc=98.703 throughput=131.0K tks/s lr=0.0000472 time=133.67 INFO:root:[step 528749] mlm_loss=1.60016 mlm_acc=65.74300 nsp_loss=0.05156 nsp_acc=98.019 throughput=136.0K tks/s lr=0.0000471 time=130.12 INFO:root:[step 528999] mlm_loss=1.73381 mlm_acc=62.96151 nsp_loss=0.08247 nsp_acc=96.659 throughput=147.0K tks/s lr=0.0000471 time=150.61 INFO:root:[step 529249] mlm_loss=1.61955 mlm_acc=65.84199 nsp_loss=0.03508 nsp_acc=98.750 throughput=134.0K tks/s lr=0.0000471 time=125.60 INFO:root:[step 529499] mlm_loss=1.68995 mlm_acc=65.46010 nsp_loss=0.06268 nsp_acc=97.556 throughput=147.0K tks/s lr=0.0000471 time=147.77 INFO:root:[step 529749] mlm_loss=1.40727 mlm_acc=69.04379 nsp_loss=0.06588 nsp_acc=97.538 throughput=156.0K tks/s lr=0.0000470 time=157.54 INFO:root:[step 529999] mlm_loss=1.55022 mlm_acc=66.32937 nsp_loss=0.03920 nsp_acc=98.646 throughput=122.0K tks/s lr=0.0000470 time=124.60 INFO:root:[step 529999] Saving checkpoints to /home/ubuntu/ckpt-master/0529999.params, /home/ubuntu/ckpt-master/0529999.states. INFO:root:[step 530249] mlm_loss=1.46749 mlm_acc=67.37468 nsp_loss=0.03647 nsp_acc=98.750 throughput=109.0K tks/s lr=0.0000470 time=124.96 INFO:root:[step 530499] mlm_loss=1.56711 mlm_acc=65.30710 nsp_loss=0.07054 nsp_acc=97.212 throughput=143.0K tks/s lr=0.0000470 time=140.45 INFO:root:[step 530749] mlm_loss=1.51294 mlm_acc=66.74214 nsp_loss=0.03510 nsp_acc=98.734 throughput=130.0K tks/s lr=0.0000469 time=115.71 INFO:root:[step 530999] mlm_loss=1.56037 mlm_acc=65.80922 nsp_loss=0.05062 nsp_acc=98.060 throughput=121.0K tks/s lr=0.0000469 time=121.67 INFO:root:[step 531249] mlm_loss=1.70055 mlm_acc=63.65505 nsp_loss=0.07282 nsp_acc=97.161 throughput=145.0K tks/s lr=0.0000469 time=149.14 INFO:root:[step 531499] mlm_loss=1.75565 mlm_acc=62.55980 nsp_loss=0.08706 nsp_acc=96.462 throughput=140.0K tks/s lr=0.0000469 time=133.31 INFO:root:[step 531749] mlm_loss=1.72341 mlm_acc=63.66974 nsp_loss=0.07691 nsp_acc=96.862 throughput=159.0K tks/s lr=0.0000468 time=166.27 INFO:root:[step 531999] mlm_loss=1.63622 mlm_acc=65.80573 nsp_loss=0.03519 nsp_acc=98.732 throughput=131.0K tks/s lr=0.0000468 time=129.18 INFO:root:[step 532249] mlm_loss=1.45191 mlm_acc=67.56383 nsp_loss=0.03963 nsp_acc=98.619 throughput=122.0K tks/s lr=0.0000468 time=108.51 INFO:root:[step 532499] mlm_loss=1.49808 mlm_acc=67.04942 nsp_loss=0.03807 nsp_acc=98.670 throughput=122.0K tks/s lr=0.0000468 time=122.35 INFO:root:[step 532749] mlm_loss=1.74887 mlm_acc=63.22685 nsp_loss=0.07572 nsp_acc=96.833 throughput=149.0K tks/s lr=0.0000467 time=146.47 INFO:root:[step 532999] mlm_loss=1.80146 mlm_acc=63.43433 nsp_loss=0.07231 nsp_acc=97.053 throughput=145.0K tks/s lr=0.0000467 time=145.03 INFO:root:[step 533249] mlm_loss=1.64728 mlm_acc=65.23767 nsp_loss=0.05530 nsp_acc=97.790 throughput=135.0K tks/s lr=0.0000467 time=137.09 INFO:root:[step 533499] mlm_loss=1.55558 mlm_acc=66.85561 nsp_loss=0.03502 nsp_acc=98.737 throughput=132.0K tks/s lr=0.0000467 time=117.58 INFO:root:[step 533749] mlm_loss=1.70582 mlm_acc=64.13944 nsp_loss=0.03297 nsp_acc=98.828 throughput=138.0K tks/s lr=0.0000466 time=150.47 INFO:root:[step 533999] mlm_loss=1.54759 mlm_acc=64.69170 nsp_loss=0.05469 nsp_acc=97.871 throughput=140.0K tks/s lr=0.0000466 time=123.57 INFO:root:[step 534249] mlm_loss=1.75653 mlm_acc=63.62181 nsp_loss=0.07322 nsp_acc=97.137 throughput=151.0K tks/s lr=0.0000466 time=151.69 INFO:root:[step 534499] mlm_loss=1.55192 mlm_acc=65.71005 nsp_loss=0.05626 nsp_acc=97.893 throughput=119.0K tks/s lr=0.0000466 time=118.88 INFO:root:[step 534749] mlm_loss=1.81937 mlm_acc=63.20943 nsp_loss=0.07952 nsp_acc=96.740 throughput=151.0K tks/s lr=0.0000465 time=153.19 INFO:root:[step 534999] mlm_loss=1.54453 mlm_acc=66.28272 nsp_loss=0.05179 nsp_acc=98.070 throughput=124.0K tks/s lr=0.0000465 time=125.79 INFO:root:[step 534999] Saving checkpoints to /home/ubuntu/ckpt-master/0534999.params, /home/ubuntu/ckpt-master/0534999.states. INFO:root:[step 535249] mlm_loss=1.55092 mlm_acc=66.92572 nsp_loss=0.03793 nsp_acc=98.643 throughput=113.0K tks/s lr=0.0000465 time=128.19 INFO:root:[step 535499] mlm_loss=1.53387 mlm_acc=66.04800 nsp_loss=0.04230 nsp_acc=98.470 throughput=126.0K tks/s lr=0.0000465 time=122.09 INFO:root:[step 535749] mlm_loss=1.52229 mlm_acc=65.01920 nsp_loss=0.04655 nsp_acc=98.274 throughput=139.0K tks/s lr=0.0000464 time=128.62 INFO:root:[step 535999] mlm_loss=1.67884 mlm_acc=64.04645 nsp_loss=0.04236 nsp_acc=98.424 throughput=146.0K tks/s lr=0.0000464 time=160.98 INFO:root:[step 536249] mlm_loss=1.43650 mlm_acc=67.49717 nsp_loss=0.03601 nsp_acc=98.703 throughput=123.0K tks/s lr=0.0000464 time=110.58 INFO:root:[step 536499] mlm_loss=1.24885 mlm_acc=69.24972 nsp_loss=0.04129 nsp_acc=98.553 throughput=107.0K tks/s lr=0.0000464 time=102.78 INFO:root:[step 536749] mlm_loss=1.53006 mlm_acc=64.94000 nsp_loss=0.06794 nsp_acc=97.295 throughput=133.0K tks/s lr=0.0000463 time=133.89 INFO:root:[step 536999] mlm_loss=1.62680 mlm_acc=65.71019 nsp_loss=0.02784 nsp_acc=98.995 throughput=136.0K tks/s lr=0.0000463 time=132.53 INFO:root:[step 537249] mlm_loss=1.46001 mlm_acc=67.11713 nsp_loss=0.03280 nsp_acc=98.871 throughput=133.0K tks/s lr=0.0000463 time=118.62 INFO:root:[step 537499] mlm_loss=1.56805 mlm_acc=66.28905 nsp_loss=0.02972 nsp_acc=98.971 throughput=129.0K tks/s lr=0.0000463 time=129.65 INFO:root:[step 537749] mlm_loss=1.91838 mlm_acc=61.07213 nsp_loss=0.05139 nsp_acc=98.047 throughput=151.0K tks/s lr=0.0000462 time=152.65 INFO:root:[step 537999] mlm_loss=1.64254 mlm_acc=64.17447 nsp_loss=0.04421 nsp_acc=98.340 throughput=129.0K tks/s lr=0.0000462 time=127.55 INFO:root:[step 538249] mlm_loss=1.36617 mlm_acc=70.13665 nsp_loss=0.05841 nsp_acc=97.874 throughput=153.0K tks/s lr=0.0000462 time=154.67 INFO:root:[step 538499] mlm_loss=1.59983 mlm_acc=65.10120 nsp_loss=0.05048 nsp_acc=98.119 throughput=150.0K tks/s lr=0.0000462 time=154.65 INFO:root:[step 538749] mlm_loss=1.80904 mlm_acc=61.62388 nsp_loss=0.05973 nsp_acc=97.655 throughput=146.0K tks/s lr=0.0000461 time=144.53 INFO:root:[step 538999] mlm_loss=1.65361 mlm_acc=64.29134 nsp_loss=0.05375 nsp_acc=98.106 throughput=145.0K tks/s lr=0.0000461 time=146.70 INFO:root:[step 539249] mlm_loss=1.39290 mlm_acc=68.21603 nsp_loss=0.03591 nsp_acc=98.706 throughput=114.0K tks/s lr=0.0000461 time=121.70 INFO:root:[step 539499] mlm_loss=1.40702 mlm_acc=67.86986 nsp_loss=0.03219 nsp_acc=98.845 throughput=120.0K tks/s lr=0.0000461 time=106.78 INFO:root:[step 539749] mlm_loss=1.78184 mlm_acc=62.34058 nsp_loss=0.05683 nsp_acc=97.786 throughput=127.0K tks/s lr=0.0000460 time=130.96 INFO:root:[step 539999] mlm_loss=1.42389 mlm_acc=67.47152 nsp_loss=0.04135 nsp_acc=98.477 throughput=115.0K tks/s lr=0.0000460 time=107.04 INFO:root:[step 539999] Saving checkpoints to /home/ubuntu/ckpt-master/0539999.params, /home/ubuntu/ckpt-master/0539999.states. INFO:root:[step 540249] mlm_loss=1.45321 mlm_acc=67.55644 nsp_loss=0.03885 nsp_acc=98.635 throughput=104.0K tks/s lr=0.0000460 time=122.22 INFO:root:[step 540499] mlm_loss=1.44215 mlm_acc=67.80179 nsp_loss=0.03476 nsp_acc=98.746 throughput=122.0K tks/s lr=0.0000460 time=112.38 INFO:root:[step 540749] mlm_loss=1.44327 mlm_acc=67.34122 nsp_loss=0.03694 nsp_acc=98.738 throughput=116.0K tks/s lr=0.0000459 time=117.89 INFO:root:[step 540999] mlm_loss=1.66867 mlm_acc=64.49773 nsp_loss=0.04280 nsp_acc=98.326 throughput=144.0K tks/s lr=0.0000459 time=146.84 INFO:root:[step 541249] mlm_loss=1.53206 mlm_acc=66.48777 nsp_loss=0.03609 nsp_acc=98.724 throughput=135.0K tks/s lr=0.0000459 time=116.49 INFO:root:[step 541499] mlm_loss=1.26715 mlm_acc=73.14374 nsp_loss=0.04814 nsp_acc=98.310 throughput=137.0K tks/s lr=0.0000459 time=137.14 INFO:root:[step 541749] mlm_loss=1.53470 mlm_acc=66.71918 nsp_loss=0.02949 nsp_acc=98.963 throughput=123.0K tks/s lr=0.0000458 time=124.22 INFO:root:[step 541999] mlm_loss=1.55139 mlm_acc=65.11163 nsp_loss=0.05596 nsp_acc=97.876 throughput=145.0K tks/s lr=0.0000458 time=127.26 INFO:root:[step 542249] mlm_loss=1.61118 mlm_acc=65.82640 nsp_loss=0.03024 nsp_acc=98.914 throughput=130.0K tks/s lr=0.0000458 time=128.87 INFO:root:[step 542499] mlm_loss=1.61182 mlm_acc=65.81755 nsp_loss=0.02792 nsp_acc=99.008 throughput=131.0K tks/s lr=0.0000458 time=135.36 INFO:root:[step 542749] mlm_loss=1.57338 mlm_acc=65.79293 nsp_loss=0.03514 nsp_acc=98.699 throughput=137.0K tks/s lr=0.0000457 time=130.86 INFO:root:[step 542999] mlm_loss=1.64249 mlm_acc=65.17120 nsp_loss=0.03965 nsp_acc=98.521 throughput=144.0K tks/s lr=0.0000457 time=142.47 INFO:root:[step 543249] mlm_loss=1.68660 mlm_acc=64.82265 nsp_loss=0.02432 nsp_acc=99.125 throughput=145.0K tks/s lr=0.0000457 time=143.65 INFO:root:[step 543499] mlm_loss=1.62907 mlm_acc=65.74508 nsp_loss=0.02936 nsp_acc=98.961 throughput=133.0K tks/s lr=0.0000457 time=129.65 INFO:root:[step 543749] mlm_loss=1.46820 mlm_acc=67.27981 nsp_loss=0.03429 nsp_acc=98.777 throughput=123.0K tks/s lr=0.0000456 time=111.55 INFO:root:[step 543999] mlm_loss=1.36245 mlm_acc=68.38903 nsp_loss=0.03127 nsp_acc=98.925 throughput=118.0K tks/s lr=0.0000456 time=108.36 INFO:root:[step 544249] mlm_loss=1.75069 mlm_acc=62.67859 nsp_loss=0.02881 nsp_acc=98.987 throughput=141.0K tks/s lr=0.0000456 time=159.80 INFO:root:[step 544499] mlm_loss=1.41130 mlm_acc=67.97621 nsp_loss=0.03217 nsp_acc=98.869 throughput=118.0K tks/s lr=0.0000456 time=108.48 INFO:root:[step 544749] mlm_loss=1.42512 mlm_acc=67.60119 nsp_loss=0.03666 nsp_acc=98.679 throughput=121.0K tks/s lr=0.0000455 time=108.36 INFO:root:[step 544999] mlm_loss=1.71594 mlm_acc=63.49856 nsp_loss=0.06333 nsp_acc=97.439 throughput=145.0K tks/s lr=0.0000455 time=161.07 INFO:root:[step 544999] Saving checkpoints to /home/ubuntu/ckpt-master/0544999.params, /home/ubuntu/ckpt-master/0544999.states. INFO:root:[step 545249] mlm_loss=1.50466 mlm_acc=66.87028 nsp_loss=0.03471 nsp_acc=98.735 throughput=117.0K tks/s lr=0.0000455 time=128.49 INFO:root:[step 545499] mlm_loss=1.39941 mlm_acc=67.97871 nsp_loss=0.03441 nsp_acc=98.856 throughput=122.0K tks/s lr=0.0000455 time=113.52 INFO:root:[step 545749] mlm_loss=1.69694 mlm_acc=64.06704 nsp_loss=0.04510 nsp_acc=98.338 throughput=138.0K tks/s lr=0.0000454 time=137.04 INFO:root:[step 545999] mlm_loss=1.59466 mlm_acc=65.31199 nsp_loss=0.03732 nsp_acc=98.645 throughput=133.0K tks/s lr=0.0000454 time=135.35 INFO:root:[step 546249] mlm_loss=1.61063 mlm_acc=65.37767 nsp_loss=0.02976 nsp_acc=98.935 throughput=137.0K tks/s lr=0.0000454 time=134.05 INFO:root:[step 546499] mlm_loss=1.56955 mlm_acc=66.43163 nsp_loss=0.03188 nsp_acc=98.876 throughput=124.0K tks/s lr=0.0000454 time=124.80 INFO:root:[step 546749] mlm_loss=1.56235 mlm_acc=66.16032 nsp_loss=0.03131 nsp_acc=98.908 throughput=140.0K tks/s lr=0.0000453 time=119.69 INFO:root:[step 546999] mlm_loss=1.63469 mlm_acc=64.58544 nsp_loss=0.03539 nsp_acc=98.719 throughput=137.0K tks/s lr=0.0000453 time=132.52 INFO:root:[step 547249] mlm_loss=1.42213 mlm_acc=67.24100 nsp_loss=0.03808 nsp_acc=98.698 throughput=124.0K tks/s lr=0.0000453 time=130.83 INFO:root:[step 547499] mlm_loss=1.28753 mlm_acc=72.54470 nsp_loss=0.03919 nsp_acc=98.698 throughput=142.0K tks/s lr=0.0000453 time=127.81 INFO:root:[step 547749] mlm_loss=1.48247 mlm_acc=66.25000 nsp_loss=0.03624 nsp_acc=98.778 throughput=131.0K tks/s lr=0.0000452 time=129.32 INFO:root:[step 547999] mlm_loss=1.42532 mlm_acc=67.44993 nsp_loss=0.03984 nsp_acc=98.617 throughput=123.0K tks/s lr=0.0000452 time=117.94 INFO:root:[step 548249] mlm_loss=1.65401 mlm_acc=65.03704 nsp_loss=0.05645 nsp_acc=97.743 throughput=157.0K tks/s lr=0.0000452 time=163.10 INFO:root:[step 548499] mlm_loss=1.59339 mlm_acc=64.29068 nsp_loss=0.06453 nsp_acc=97.477 throughput=143.0K tks/s lr=0.0000452 time=148.13 INFO:root:[step 548749] mlm_loss=1.48690 mlm_acc=67.10122 nsp_loss=0.03608 nsp_acc=98.743 throughput=125.0K tks/s lr=0.0000451 time=109.17 INFO:root:[step 548999] mlm_loss=1.38011 mlm_acc=68.26166 nsp_loss=0.03683 nsp_acc=98.691 throughput=106.0K tks/s lr=0.0000451 time=116.78 INFO:root:[step 549249] mlm_loss=1.42831 mlm_acc=67.74972 nsp_loss=0.03539 nsp_acc=98.768 throughput=125.0K tks/s lr=0.0000451 time=110.44 INFO:root:[step 549499] mlm_loss=1.59828 mlm_acc=65.40720 nsp_loss=0.05438 nsp_acc=97.936 throughput=148.0K tks/s lr=0.0000451 time=147.87 INFO:root:[step 549749] mlm_loss=1.66262 mlm_acc=65.67201 nsp_loss=0.02748 nsp_acc=99.020 throughput=137.0K tks/s lr=0.0000450 time=135.24 INFO:root:[step 549999] mlm_loss=1.62475 mlm_acc=66.02798 nsp_loss=0.02997 nsp_acc=98.934 throughput=133.0K tks/s lr=0.0000450 time=131.78 INFO:root:[step 549999] Saving checkpoints to /home/ubuntu/ckpt-master/0549999.params, /home/ubuntu/ckpt-master/0549999.states. INFO:root:[step 550249] mlm_loss=1.58490 mlm_acc=66.46155 nsp_loss=0.03227 nsp_acc=98.845 throughput=122.0K tks/s lr=0.0000450 time=136.73 INFO:root:[step 550499] mlm_loss=1.54887 mlm_acc=66.69275 nsp_loss=0.03148 nsp_acc=98.871 throughput=126.0K tks/s lr=0.0000450 time=127.48 INFO:root:[step 550749] mlm_loss=1.52970 mlm_acc=66.19565 nsp_loss=0.03349 nsp_acc=98.798 throughput=128.0K tks/s lr=0.0000449 time=128.99 INFO:root:[step 550999] mlm_loss=1.46094 mlm_acc=67.02152 nsp_loss=0.03543 nsp_acc=98.806 throughput=131.0K tks/s lr=0.0000449 time=114.63 INFO:root:[step 551249] mlm_loss=1.54622 mlm_acc=66.33672 nsp_loss=0.02947 nsp_acc=98.956 throughput=127.0K tks/s lr=0.0000449 time=128.55 INFO:root:[step 551499] mlm_loss=1.67271 mlm_acc=63.59711 nsp_loss=0.04157 nsp_acc=98.460 throughput=143.0K tks/s lr=0.0000449 time=145.98 INFO:root:[step 551749] mlm_loss=1.54291 mlm_acc=66.53201 nsp_loss=0.03063 nsp_acc=98.934 throughput=131.0K tks/s lr=0.0000448 time=125.62 INFO:root:[step 551999] mlm_loss=1.72585 mlm_acc=63.88110 nsp_loss=0.04120 nsp_acc=98.459 throughput=144.0K tks/s lr=0.0000448 time=147.48 INFO:root:[step 552249] mlm_loss=1.55608 mlm_acc=66.35388 nsp_loss=0.03264 nsp_acc=98.878 throughput=136.0K tks/s lr=0.0000448 time=117.62 INFO:root:[step 552499] mlm_loss=1.69322 mlm_acc=65.02465 nsp_loss=0.02343 nsp_acc=99.159 throughput=139.0K tks/s lr=0.0000448 time=153.37 INFO:root:[step 552749] mlm_loss=1.48952 mlm_acc=65.85206 nsp_loss=0.04612 nsp_acc=98.379 throughput=138.0K tks/s lr=0.0000447 time=117.77 INFO:root:[step 552999] mlm_loss=1.52551 mlm_acc=66.24855 nsp_loss=0.03689 nsp_acc=98.635 throughput=129.0K tks/s lr=0.0000447 time=131.87 INFO:root:[step 553249] mlm_loss=1.56196 mlm_acc=64.58116 nsp_loss=0.05102 nsp_acc=98.152 throughput=139.0K tks/s lr=0.0000447 time=135.32 INFO:root:[step 553499] mlm_loss=1.73867 mlm_acc=63.42521 nsp_loss=0.07810 nsp_acc=96.873 throughput=155.0K tks/s lr=0.0000447 time=158.90 INFO:root:[step 553749] mlm_loss=1.63935 mlm_acc=64.62310 nsp_loss=0.03511 nsp_acc=98.776 throughput=135.0K tks/s lr=0.0000446 time=139.14 INFO:root:[step 553999] mlm_loss=1.50620 mlm_acc=66.76184 nsp_loss=0.03339 nsp_acc=98.827 throughput=136.0K tks/s lr=0.0000446 time=116.44 INFO:root:[step 554249] mlm_loss=1.68465 mlm_acc=65.41188 nsp_loss=0.02686 nsp_acc=99.031 throughput=142.0K tks/s lr=0.0000446 time=138.39 INFO:root:[step 554499] mlm_loss=1.80229 mlm_acc=62.09067 nsp_loss=0.07280 nsp_acc=97.026 throughput=147.0K tks/s lr=0.0000446 time=164.86 INFO:root:[step 554749] mlm_loss=1.62532 mlm_acc=64.11320 nsp_loss=0.05067 nsp_acc=98.152 throughput=143.0K tks/s lr=0.0000445 time=141.51 INFO:root:[step 554999] mlm_loss=1.44653 mlm_acc=66.94466 nsp_loss=0.04759 nsp_acc=98.230 throughput=119.0K tks/s lr=0.0000445 time=112.77 INFO:root:[step 554999] Saving checkpoints to /home/ubuntu/ckpt-master/0554999.params, /home/ubuntu/ckpt-master/0554999.states. INFO:root:[step 555249] mlm_loss=1.61854 mlm_acc=64.35332 nsp_loss=0.05864 nsp_acc=97.676 throughput=125.0K tks/s lr=0.0000445 time=152.51 INFO:root:[step 555499] mlm_loss=1.50622 mlm_acc=67.24871 nsp_loss=0.03203 nsp_acc=98.894 throughput=129.0K tks/s lr=0.0000445 time=115.97 INFO:root:[step 555749] mlm_loss=1.55767 mlm_acc=65.20929 nsp_loss=0.05758 nsp_acc=97.849 throughput=138.0K tks/s lr=0.0000444 time=140.13 INFO:root:[step 555999] mlm_loss=1.36775 mlm_acc=67.74311 nsp_loss=0.05204 nsp_acc=98.027 throughput=111.0K tks/s lr=0.0000444 time=107.08 INFO:root:[step 556249] mlm_loss=1.41985 mlm_acc=67.62247 nsp_loss=0.04266 nsp_acc=98.486 throughput=110.0K tks/s lr=0.0000444 time=117.34 INFO:root:[step 556499] mlm_loss=1.61864 mlm_acc=65.86370 nsp_loss=0.03082 nsp_acc=98.901 throughput=132.0K tks/s lr=0.0000444 time=130.21 INFO:root:[step 556749] mlm_loss=1.66998 mlm_acc=65.52717 nsp_loss=0.02773 nsp_acc=99.043 throughput=146.0K tks/s lr=0.0000443 time=129.58 INFO:root:[step 556999] mlm_loss=1.65744 mlm_acc=65.69415 nsp_loss=0.02958 nsp_acc=98.940 throughput=138.0K tks/s lr=0.0000443 time=132.43 INFO:root:[step 557249] mlm_loss=1.57541 mlm_acc=66.22930 nsp_loss=0.03097 nsp_acc=98.941 throughput=130.0K tks/s lr=0.0000443 time=126.45 INFO:root:[step 557499] mlm_loss=1.57235 mlm_acc=66.08227 nsp_loss=0.03383 nsp_acc=98.782 throughput=130.0K tks/s lr=0.0000443 time=126.36 INFO:root:[step 557749] mlm_loss=1.78260 mlm_acc=63.14408 nsp_loss=0.04453 nsp_acc=98.285 throughput=148.0K tks/s lr=0.0000442 time=151.24 INFO:root:[step 557999] mlm_loss=1.64786 mlm_acc=65.69920 nsp_loss=0.02922 nsp_acc=98.984 throughput=138.0K tks/s lr=0.0000442 time=131.64 INFO:root:[step 558249] mlm_loss=1.71784 mlm_acc=64.25144 nsp_loss=0.04676 nsp_acc=98.278 throughput=151.0K tks/s lr=0.0000442 time=151.74 INFO:root:[step 558499] mlm_loss=1.60207 mlm_acc=66.17869 nsp_loss=0.03198 nsp_acc=98.893 throughput=134.0K tks/s lr=0.0000442 time=130.21 INFO:root:[step 558749] mlm_loss=1.51074 mlm_acc=66.83566 nsp_loss=0.03350 nsp_acc=98.821 throughput=130.0K tks/s lr=0.0000441 time=121.74 INFO:root:[step 558999] mlm_loss=1.60973 mlm_acc=65.94494 nsp_loss=0.02969 nsp_acc=98.944 throughput=138.0K tks/s lr=0.0000441 time=132.27 INFO:root:[step 559249] mlm_loss=1.48098 mlm_acc=67.05818 nsp_loss=0.03337 nsp_acc=98.797 throughput=120.0K tks/s lr=0.0000441 time=124.99 INFO:root:[step 559499] mlm_loss=1.49213 mlm_acc=66.42280 nsp_loss=0.04023 nsp_acc=98.501 throughput=135.0K tks/s lr=0.0000441 time=116.23 INFO:root:[step 559749] mlm_loss=1.60987 mlm_acc=65.17305 nsp_loss=0.05229 nsp_acc=98.098 throughput=138.0K tks/s lr=0.0000440 time=138.73 INFO:root:[step 559999] mlm_loss=1.63643 mlm_acc=65.44217 nsp_loss=0.03728 nsp_acc=98.616 throughput=141.0K tks/s lr=0.0000440 time=138.49 INFO:root:[step 559999] Saving checkpoints to /home/ubuntu/ckpt-master/0559999.params, /home/ubuntu/ckpt-master/0559999.states. INFO:root:[step 560249] mlm_loss=1.51574 mlm_acc=67.08135 nsp_loss=0.03368 nsp_acc=98.812 throughput=109.0K tks/s lr=0.0000440 time=140.10 INFO:root:[step 560499] mlm_loss=1.50578 mlm_acc=66.94335 nsp_loss=0.03233 nsp_acc=98.866 throughput=129.0K tks/s lr=0.0000440 time=115.27 INFO:root:[step 560749] mlm_loss=1.29481 mlm_acc=68.51800 nsp_loss=0.04301 nsp_acc=98.475 throughput=109.0K tks/s lr=0.0000439 time=108.94 INFO:root:[step 560999] mlm_loss=1.67623 mlm_acc=63.33712 nsp_loss=0.04812 nsp_acc=98.178 throughput=138.0K tks/s lr=0.0000439 time=140.31 INFO:root:[step 561249] mlm_loss=1.38872 mlm_acc=67.90059 nsp_loss=0.03789 nsp_acc=98.651 throughput=117.0K tks/s lr=0.0000439 time=109.92 INFO:root:[step 561499] mlm_loss=1.56249 mlm_acc=65.22462 nsp_loss=0.04787 nsp_acc=98.150 throughput=125.0K tks/s lr=0.0000439 time=124.97 INFO:root:[step 561749] mlm_loss=1.70051 mlm_acc=63.81665 nsp_loss=0.04724 nsp_acc=98.269 throughput=134.0K tks/s lr=0.0000438 time=132.64 INFO:root:[step 561999] mlm_loss=1.83446 mlm_acc=62.22975 nsp_loss=0.04093 nsp_acc=98.440 throughput=160.0K tks/s lr=0.0000438 time=165.38 INFO:root:[step 562249] mlm_loss=1.34953 mlm_acc=70.08509 nsp_loss=0.04643 nsp_acc=98.407 throughput=120.0K tks/s lr=0.0000438 time=124.75 INFO:root:[step 562499] mlm_loss=1.35276 mlm_acc=71.63741 nsp_loss=0.04657 nsp_acc=98.378 throughput=137.0K tks/s lr=0.0000438 time=123.44 INFO:root:[step 562749] mlm_loss=1.69218 mlm_acc=64.72103 nsp_loss=0.06148 nsp_acc=97.573 throughput=144.0K tks/s lr=0.0000437 time=155.97 INFO:root:[step 562999] mlm_loss=1.68116 mlm_acc=65.48888 nsp_loss=0.02672 nsp_acc=99.060 throughput=141.0K tks/s lr=0.0000437 time=138.42 INFO:root:[step 563249] mlm_loss=1.56807 mlm_acc=66.35776 nsp_loss=0.02977 nsp_acc=98.956 throughput=134.0K tks/s lr=0.0000437 time=122.12 INFO:root:[step 563499] mlm_loss=1.45749 mlm_acc=67.49976 nsp_loss=0.03855 nsp_acc=98.608 throughput=116.0K tks/s lr=0.0000437 time=119.92 INFO:root:[step 563749] mlm_loss=1.68252 mlm_acc=64.30263 nsp_loss=0.05786 nsp_acc=97.712 throughput=150.0K tks/s lr=0.0000436 time=151.10 INFO:root:[step 563999] mlm_loss=1.49570 mlm_acc=66.18536 nsp_loss=0.07250 nsp_acc=97.004 throughput=131.0K tks/s lr=0.0000436 time=118.82 INFO:root:[step 564249] mlm_loss=1.49369 mlm_acc=67.24815 nsp_loss=0.03558 nsp_acc=98.751 throughput=121.0K tks/s lr=0.0000436 time=121.15 INFO:root:[step 564499] mlm_loss=1.63859 mlm_acc=65.73578 nsp_loss=0.03448 nsp_acc=98.824 throughput=146.0K tks/s lr=0.0000436 time=140.95 INFO:root:[step 564749] mlm_loss=1.78766 mlm_acc=63.79753 nsp_loss=0.04704 nsp_acc=98.172 throughput=141.0K tks/s lr=0.0000435 time=141.26 INFO:root:[step 564999] mlm_loss=1.63913 mlm_acc=64.55066 nsp_loss=0.04998 nsp_acc=98.194 throughput=130.0K tks/s lr=0.0000435 time=126.76 INFO:root:[step 564999] Saving checkpoints to /home/ubuntu/ckpt-master/0564999.params, /home/ubuntu/ckpt-master/0564999.states. INFO:root:[step 565249] mlm_loss=1.68386 mlm_acc=64.32484 nsp_loss=0.04555 nsp_acc=98.261 throughput=131.0K tks/s lr=0.0000435 time=166.11 INFO:root:[step 565499] mlm_loss=1.55234 mlm_acc=66.69455 nsp_loss=0.03286 nsp_acc=98.839 throughput=134.0K tks/s lr=0.0000435 time=116.44 INFO:root:[step 565749] mlm_loss=1.68203 mlm_acc=65.37727 nsp_loss=0.03022 nsp_acc=98.880 throughput=144.0K tks/s lr=0.0000434 time=137.71 INFO:root:[step 565999] mlm_loss=1.68080 mlm_acc=65.46043 nsp_loss=0.02590 nsp_acc=99.073 throughput=143.0K tks/s lr=0.0000434 time=140.53 INFO:root:[step 566249] mlm_loss=1.71938 mlm_acc=63.49038 nsp_loss=0.07604 nsp_acc=97.003 throughput=146.0K tks/s lr=0.0000434 time=164.96 INFO:root:[step 566499] mlm_loss=1.62216 mlm_acc=64.17701 nsp_loss=0.03812 nsp_acc=98.601 throughput=142.0K tks/s lr=0.0000434 time=142.99 INFO:root:[step 566749] mlm_loss=1.45721 mlm_acc=67.37452 nsp_loss=0.03909 nsp_acc=98.664 throughput=121.0K tks/s lr=0.0000433 time=111.23 INFO:root:[step 566999] mlm_loss=1.55555 mlm_acc=65.62880 nsp_loss=0.03600 nsp_acc=98.690 throughput=130.0K tks/s lr=0.0000433 time=130.37 INFO:root:[step 567249] mlm_loss=1.53647 mlm_acc=66.61990 nsp_loss=0.03060 nsp_acc=98.943 throughput=136.0K tks/s lr=0.0000433 time=117.65 INFO:root:[step 567499] mlm_loss=1.54990 mlm_acc=65.11419 nsp_loss=0.08995 nsp_acc=96.290 throughput=128.0K tks/s lr=0.0000433 time=137.39 INFO:root:[step 567749] mlm_loss=1.55163 mlm_acc=66.68806 nsp_loss=0.03602 nsp_acc=98.697 throughput=128.0K tks/s lr=0.0000432 time=121.84 INFO:root:[step 567999] mlm_loss=1.72757 mlm_acc=64.89907 nsp_loss=0.05946 nsp_acc=97.686 throughput=145.0K tks/s lr=0.0000432 time=149.71 INFO:root:[step 568249] mlm_loss=1.52595 mlm_acc=67.00123 nsp_loss=0.03256 nsp_acc=98.858 throughput=132.0K tks/s lr=0.0000432 time=114.74 INFO:root:[step 568499] mlm_loss=1.79882 mlm_acc=63.44484 nsp_loss=0.05543 nsp_acc=97.828 throughput=143.0K tks/s lr=0.0000432 time=145.30 INFO:root:[step 568749] mlm_loss=1.83021 mlm_acc=62.15545 nsp_loss=0.04784 nsp_acc=98.161 throughput=149.0K tks/s lr=0.0000431 time=170.42 INFO:root:[step 568999] mlm_loss=1.49509 mlm_acc=67.08057 nsp_loss=0.03502 nsp_acc=98.792 throughput=126.0K tks/s lr=0.0000431 time=113.65 INFO:root:[step 569249] mlm_loss=1.57217 mlm_acc=66.64169 nsp_loss=0.03182 nsp_acc=98.862 throughput=131.0K tks/s lr=0.0000431 time=130.40 INFO:root:[step 569499] mlm_loss=1.65330 mlm_acc=65.78360 nsp_loss=0.02898 nsp_acc=98.977 throughput=136.0K tks/s lr=0.0000431 time=132.64 INFO:root:[step 569749] mlm_loss=1.42877 mlm_acc=67.48546 nsp_loss=0.04029 nsp_acc=98.606 throughput=124.0K tks/s lr=0.0000430 time=114.55 INFO:root:[step 569999] mlm_loss=1.39115 mlm_acc=67.77213 nsp_loss=0.04544 nsp_acc=98.423 throughput=121.0K tks/s lr=0.0000430 time=109.34 INFO:root:[step 569999] Saving checkpoints to /home/ubuntu/ckpt-master/0569999.params, /home/ubuntu/ckpt-master/0569999.states. INFO:root:[step 570249] mlm_loss=1.50328 mlm_acc=66.92875 nsp_loss=0.03640 nsp_acc=98.711 throughput=106.0K tks/s lr=0.0000430 time=136.45 INFO:root:[step 570499] mlm_loss=1.41557 mlm_acc=67.28598 nsp_loss=0.04111 nsp_acc=98.531 throughput=124.0K tks/s lr=0.0000430 time=114.77 INFO:root:[step 570749] mlm_loss=1.41789 mlm_acc=67.58725 nsp_loss=0.03966 nsp_acc=98.609 throughput=114.0K tks/s lr=0.0000429 time=118.23 INFO:root:[step 570999] mlm_loss=1.42008 mlm_acc=67.49443 nsp_loss=0.03872 nsp_acc=98.606 throughput=125.0K tks/s lr=0.0000429 time=109.86 INFO:root:[step 571249] mlm_loss=1.75760 mlm_acc=63.37590 nsp_loss=0.05335 nsp_acc=97.917 throughput=146.0K tks/s lr=0.0000429 time=144.77 INFO:root:[step 571499] mlm_loss=1.51414 mlm_acc=67.28459 nsp_loss=0.03515 nsp_acc=98.749 throughput=126.0K tks/s lr=0.0000429 time=112.09 INFO:root:[step 571749] mlm_loss=1.93040 mlm_acc=60.95230 nsp_loss=0.10530 nsp_acc=95.773 throughput=141.0K tks/s lr=0.0000428 time=159.94 INFO:root:[step 571999] mlm_loss=1.49951 mlm_acc=67.22053 nsp_loss=0.03637 nsp_acc=98.727 throughput=124.0K tks/s lr=0.0000428 time=113.15 INFO:root:[step 572249] mlm_loss=1.55495 mlm_acc=65.73893 nsp_loss=0.03177 nsp_acc=98.893 throughput=130.0K tks/s lr=0.0000428 time=131.45 INFO:root:[step 572499] mlm_loss=1.42295 mlm_acc=67.86484 nsp_loss=0.03524 nsp_acc=98.733 throughput=123.0K tks/s lr=0.0000428 time=110.73 INFO:root:[step 572749] mlm_loss=1.45742 mlm_acc=67.63968 nsp_loss=0.03661 nsp_acc=98.700 throughput=113.0K tks/s lr=0.0000427 time=120.06 INFO:root:[step 572999] mlm_loss=1.46172 mlm_acc=67.83554 nsp_loss=0.03678 nsp_acc=98.696 throughput=122.0K tks/s lr=0.0000427 time=107.98 INFO:root:[step 573249] mlm_loss=1.70746 mlm_acc=64.13531 nsp_loss=0.06035 nsp_acc=97.557 throughput=156.0K tks/s lr=0.0000427 time=153.85 INFO:root:[step 573499] mlm_loss=1.59201 mlm_acc=65.96866 nsp_loss=0.03356 nsp_acc=98.764 throughput=137.0K tks/s lr=0.0000427 time=133.68 INFO:root:[step 573749] mlm_loss=1.68967 mlm_acc=64.56740 nsp_loss=0.04128 nsp_acc=98.427 throughput=141.0K tks/s lr=0.0000426 time=141.45 INFO:root:[step 573999] mlm_loss=1.48227 mlm_acc=65.80266 nsp_loss=0.04815 nsp_acc=98.249 throughput=125.0K tks/s lr=0.0000426 time=113.76 INFO:root:[step 574249] mlm_loss=1.64696 mlm_acc=64.35509 nsp_loss=0.10583 nsp_acc=95.607 throughput=145.0K tks/s lr=0.0000426 time=162.16 INFO:root:[step 574499] mlm_loss=1.55588 mlm_acc=66.80729 nsp_loss=0.02962 nsp_acc=98.930 throughput=136.0K tks/s lr=0.0000426 time=118.52 INFO:root:[step 574749] mlm_loss=1.69954 mlm_acc=65.23083 nsp_loss=0.02739 nsp_acc=99.023 throughput=145.0K tks/s lr=0.0000425 time=143.93 INFO:root:[step 574999] mlm_loss=1.38371 mlm_acc=68.15028 nsp_loss=0.03961 nsp_acc=98.594 throughput=107.0K tks/s lr=0.0000425 time=115.83 INFO:root:[step 574999] Saving checkpoints to /home/ubuntu/ckpt-master/0574999.params, /home/ubuntu/ckpt-master/0574999.states. INFO:root:[step 575249] mlm_loss=1.51042 mlm_acc=66.14126 nsp_loss=0.03354 nsp_acc=98.826 throughput=121.0K tks/s lr=0.0000425 time=133.10 INFO:root:[step 575499] mlm_loss=1.55922 mlm_acc=66.57763 nsp_loss=0.03396 nsp_acc=98.814 throughput=127.0K tks/s lr=0.0000425 time=126.39 INFO:root:[step 575749] mlm_loss=1.60333 mlm_acc=65.38954 nsp_loss=0.03343 nsp_acc=98.746 throughput=140.0K tks/s lr=0.0000424 time=134.15 INFO:root:[step 575999] mlm_loss=1.73849 mlm_acc=64.01533 nsp_loss=0.04414 nsp_acc=98.275 throughput=152.0K tks/s lr=0.0000424 time=155.16 INFO:root:[step 576249] mlm_loss=1.71093 mlm_acc=64.53544 nsp_loss=0.04819 nsp_acc=98.130 throughput=151.0K tks/s lr=0.0000424 time=152.41 INFO:root:[step 576499] mlm_loss=1.47056 mlm_acc=66.92124 nsp_loss=0.03829 nsp_acc=98.537 throughput=127.0K tks/s lr=0.0000424 time=127.44 INFO:root:[step 576749] mlm_loss=1.71517 mlm_acc=64.16100 nsp_loss=0.08665 nsp_acc=96.277 throughput=145.0K tks/s lr=0.0000423 time=141.33 INFO:root:[step 576999] mlm_loss=1.60619 mlm_acc=66.15989 nsp_loss=0.03137 nsp_acc=98.911 throughput=130.0K tks/s lr=0.0000423 time=130.64 INFO:root:[step 577249] mlm_loss=1.61595 mlm_acc=63.77126 nsp_loss=0.03722 nsp_acc=98.634 throughput=140.0K tks/s lr=0.0000423 time=140.67 INFO:root:[step 577499] mlm_loss=1.42420 mlm_acc=67.62006 nsp_loss=0.04016 nsp_acc=98.613 throughput=120.0K tks/s lr=0.0000423 time=111.95 INFO:root:[step 577749] mlm_loss=1.54564 mlm_acc=66.44069 nsp_loss=0.03637 nsp_acc=98.693 throughput=134.0K tks/s lr=0.0000422 time=127.43 INFO:root:[step 577999] mlm_loss=1.56942 mlm_acc=66.79159 nsp_loss=0.03359 nsp_acc=98.825 throughput=131.0K tks/s lr=0.0000422 time=136.85 INFO:root:[step 578249] mlm_loss=1.41568 mlm_acc=67.93196 nsp_loss=0.05114 nsp_acc=98.164 throughput=132.0K tks/s lr=0.0000422 time=113.70 INFO:root:[step 578499] mlm_loss=1.71900 mlm_acc=64.91631 nsp_loss=0.02538 nsp_acc=99.070 throughput=147.0K tks/s lr=0.0000422 time=145.96 INFO:root:[step 578749] mlm_loss=1.43521 mlm_acc=67.66937 nsp_loss=0.03374 nsp_acc=98.821 throughput=114.0K tks/s lr=0.0000421 time=118.41 INFO:root:[step 578999] mlm_loss=1.46439 mlm_acc=67.71481 nsp_loss=0.03850 nsp_acc=98.638 throughput=118.0K tks/s lr=0.0000421 time=109.05 INFO:root:[step 579249] mlm_loss=1.62061 mlm_acc=64.26803 nsp_loss=0.09015 nsp_acc=96.391 throughput=134.0K tks/s lr=0.0000421 time=132.41 INFO:root:[step 579499] mlm_loss=1.65592 mlm_acc=65.81250 nsp_loss=0.02861 nsp_acc=98.958 throughput=146.0K tks/s lr=0.0000421 time=127.43 INFO:root:[step 579749] mlm_loss=1.78589 mlm_acc=63.12667 nsp_loss=0.05218 nsp_acc=97.907 throughput=150.0K tks/s lr=0.0000420 time=162.27 INFO:root:[step 579999] mlm_loss=1.54323 mlm_acc=67.50963 nsp_loss=0.05338 nsp_acc=97.939 throughput=155.0K tks/s lr=0.0000420 time=157.10 INFO:root:[step 579999] Saving checkpoints to /home/ubuntu/ckpt-master/0579999.params, /home/ubuntu/ckpt-master/0579999.states. INFO:root:[step 580249] mlm_loss=1.69981 mlm_acc=64.34119 nsp_loss=0.06359 nsp_acc=97.516 throughput=129.0K tks/s lr=0.0000420 time=156.05 INFO:root:[step 580499] mlm_loss=1.53967 mlm_acc=66.11501 nsp_loss=0.04304 nsp_acc=98.448 throughput=132.0K tks/s lr=0.0000420 time=129.19 INFO:root:[step 580749] mlm_loss=1.59524 mlm_acc=65.88078 nsp_loss=0.04479 nsp_acc=98.358 throughput=138.0K tks/s lr=0.0000419 time=140.79 INFO:root:[step 580999] mlm_loss=1.48204 mlm_acc=67.34722 nsp_loss=0.03322 nsp_acc=98.830 throughput=124.0K tks/s lr=0.0000419 time=111.11 INFO:root:[step 581249] mlm_loss=1.40153 mlm_acc=67.80388 nsp_loss=0.04243 nsp_acc=98.518 throughput=123.0K tks/s lr=0.0000419 time=109.85 INFO:root:[step 581499] mlm_loss=1.42953 mlm_acc=67.74230 nsp_loss=0.03715 nsp_acc=98.696 throughput=113.0K tks/s lr=0.0000419 time=118.97 INFO:root:[step 581749] mlm_loss=1.52473 mlm_acc=66.24833 nsp_loss=0.03147 nsp_acc=98.908 throughput=132.0K tks/s lr=0.0000418 time=129.35 INFO:root:[step 581999] mlm_loss=1.41408 mlm_acc=67.69161 nsp_loss=0.04226 nsp_acc=98.461 throughput=118.0K tks/s lr=0.0000418 time=109.18 INFO:root:[step 582249] mlm_loss=1.39794 mlm_acc=68.13353 nsp_loss=0.03862 nsp_acc=98.618 throughput=119.0K tks/s lr=0.0000418 time=106.51 INFO:root:[step 582499] mlm_loss=1.41087 mlm_acc=68.31507 nsp_loss=0.04182 nsp_acc=98.537 throughput=119.0K tks/s lr=0.0000418 time=106.17 INFO:root:[step 582749] mlm_loss=1.72736 mlm_acc=64.31230 nsp_loss=0.10195 nsp_acc=95.665 throughput=136.0K tks/s lr=0.0000417 time=137.83 INFO:root:[step 582999] mlm_loss=1.57558 mlm_acc=66.04232 nsp_loss=0.04391 nsp_acc=98.331 throughput=132.0K tks/s lr=0.0000417 time=129.98 INFO:root:[step 583249] mlm_loss=1.60984 mlm_acc=64.94465 nsp_loss=0.04933 nsp_acc=98.147 throughput=143.0K tks/s lr=0.0000417 time=147.15 INFO:root:[step 583499] mlm_loss=1.57860 mlm_acc=66.13078 nsp_loss=0.03176 nsp_acc=98.870 throughput=135.0K tks/s lr=0.0000417 time=131.02 INFO:root:[step 583749] mlm_loss=1.49966 mlm_acc=67.17012 nsp_loss=0.03713 nsp_acc=98.699 throughput=126.0K tks/s lr=0.0000416 time=114.65 INFO:root:[step 583999] mlm_loss=1.53447 mlm_acc=66.39595 nsp_loss=0.03043 nsp_acc=98.953 throughput=133.0K tks/s lr=0.0000416 time=130.61 INFO:root:[step 584249] mlm_loss=1.46070 mlm_acc=67.55953 nsp_loss=0.03614 nsp_acc=98.695 throughput=124.0K tks/s lr=0.0000416 time=112.85 INFO:root:[step 584499] mlm_loss=1.48647 mlm_acc=67.19176 nsp_loss=0.03423 nsp_acc=98.816 throughput=117.0K tks/s lr=0.0000416 time=121.25 INFO:root:[step 584749] mlm_loss=1.60126 mlm_acc=64.49366 nsp_loss=0.05288 nsp_acc=97.968 throughput=146.0K tks/s lr=0.0000415 time=141.22 INFO:root:[step 584999] mlm_loss=1.67779 mlm_acc=64.70793 nsp_loss=0.04383 nsp_acc=98.330 throughput=141.0K tks/s lr=0.0000415 time=145.49 INFO:root:[step 584999] Saving checkpoints to /home/ubuntu/ckpt-master/0584999.params, /home/ubuntu/ckpt-master/0584999.states. INFO:root:[step 585249] mlm_loss=1.43199 mlm_acc=67.84727 nsp_loss=0.03478 nsp_acc=98.832 throughput=107.0K tks/s lr=0.0000415 time=123.95 INFO:root:[step 585499] mlm_loss=1.57754 mlm_acc=65.74812 nsp_loss=0.03941 nsp_acc=98.476 throughput=139.0K tks/s lr=0.0000415 time=133.75 INFO:root:[step 585749] mlm_loss=1.54655 mlm_acc=66.12118 nsp_loss=0.04382 nsp_acc=98.388 throughput=131.0K tks/s lr=0.0000414 time=135.17 INFO:root:[step 585999] mlm_loss=1.43538 mlm_acc=67.53521 nsp_loss=0.03979 nsp_acc=98.580 throughput=122.0K tks/s lr=0.0000414 time=111.08 INFO:root:[step 586249] mlm_loss=1.57692 mlm_acc=64.75651 nsp_loss=0.07883 nsp_acc=96.880 throughput=148.0K tks/s lr=0.0000414 time=147.05 INFO:root:[step 586499] mlm_loss=1.55802 mlm_acc=65.06810 nsp_loss=0.04479 nsp_acc=98.309 throughput=127.0K tks/s lr=0.0000414 time=127.37 INFO:root:[step 586749] mlm_loss=1.69105 mlm_acc=64.27183 nsp_loss=0.04499 nsp_acc=98.289 throughput=139.0K tks/s lr=0.0000413 time=142.21 INFO:root:[step 586999] mlm_loss=1.44748 mlm_acc=67.65928 nsp_loss=0.03997 nsp_acc=98.605 throughput=119.0K tks/s lr=0.0000413 time=110.60 INFO:root:[step 587249] mlm_loss=1.41908 mlm_acc=67.83180 nsp_loss=0.03890 nsp_acc=98.643 throughput=119.0K tks/s lr=0.0000413 time=109.49 INFO:root:[step 587499] mlm_loss=1.77954 mlm_acc=63.67218 nsp_loss=0.05385 nsp_acc=97.926 throughput=132.0K tks/s lr=0.0000413 time=134.09 INFO:root:[step 587749] mlm_loss=1.82967 mlm_acc=62.79991 nsp_loss=0.05165 nsp_acc=97.975 throughput=139.0K tks/s lr=0.0000412 time=137.55 INFO:root:[step 587999] mlm_loss=1.56906 mlm_acc=64.64199 nsp_loss=0.05010 nsp_acc=98.088 throughput=133.0K tks/s lr=0.0000412 time=129.54 INFO:root:[step 588249] mlm_loss=1.66792 mlm_acc=64.65374 nsp_loss=0.05506 nsp_acc=97.876 throughput=157.0K tks/s lr=0.0000412 time=161.95 INFO:root:[step 588499] mlm_loss=1.71084 mlm_acc=64.32575 nsp_loss=0.06880 nsp_acc=97.238 throughput=149.0K tks/s lr=0.0000412 time=163.64 INFO:root:[step 588749] mlm_loss=1.70350 mlm_acc=64.32290 nsp_loss=0.12335 nsp_acc=94.789 throughput=140.0K tks/s lr=0.0000411 time=151.07 INFO:root:[step 588999] mlm_loss=1.42644 mlm_acc=67.70802 nsp_loss=0.03948 nsp_acc=98.593 throughput=121.0K tks/s lr=0.0000411 time=110.09 INFO:root:[step 589249] mlm_loss=1.49068 mlm_acc=67.01489 nsp_loss=0.03588 nsp_acc=98.755 throughput=127.0K tks/s lr=0.0000411 time=109.53 INFO:root:[step 589499] mlm_loss=1.53579 mlm_acc=65.30226 nsp_loss=0.06463 nsp_acc=97.450 throughput=134.0K tks/s lr=0.0000411 time=139.21 INFO:root:[step 589749] mlm_loss=1.66292 mlm_acc=63.05293 nsp_loss=0.06719 nsp_acc=97.325 throughput=142.0K tks/s lr=0.0000410 time=136.40 INFO:root:[step 589999] mlm_loss=1.75025 mlm_acc=62.82701 nsp_loss=0.11074 nsp_acc=95.265 throughput=156.0K tks/s lr=0.0000410 time=159.48 INFO:root:[step 589999] Saving checkpoints to /home/ubuntu/ckpt-master/0589999.params, /home/ubuntu/ckpt-master/0589999.states. INFO:root:[step 590249] mlm_loss=1.57393 mlm_acc=65.88753 nsp_loss=0.04091 nsp_acc=98.550 throughput=116.0K tks/s lr=0.0000410 time=142.78 INFO:root:[step 590499] mlm_loss=1.62048 mlm_acc=66.09808 nsp_loss=0.03140 nsp_acc=98.903 throughput=129.0K tks/s lr=0.0000410 time=131.20 INFO:root:[step 590749] mlm_loss=1.42098 mlm_acc=67.95345 nsp_loss=0.03751 nsp_acc=98.664 throughput=118.0K tks/s lr=0.0000409 time=108.18 INFO:root:[step 590999] mlm_loss=1.54296 mlm_acc=66.64732 nsp_loss=0.03678 nsp_acc=98.735 throughput=132.0K tks/s lr=0.0000409 time=114.69 INFO:root:[step 591249] mlm_loss=1.90596 mlm_acc=61.30048 nsp_loss=0.07032 nsp_acc=97.158 throughput=148.0K tks/s lr=0.0000409 time=163.16 INFO:root:[step 591499] mlm_loss=1.52192 mlm_acc=66.40748 nsp_loss=0.06758 nsp_acc=97.303 throughput=135.0K tks/s lr=0.0000409 time=120.78 INFO:root:[step 591749] mlm_loss=1.64717 mlm_acc=65.65464 nsp_loss=0.02944 nsp_acc=98.934 throughput=142.0K tks/s lr=0.0000408 time=137.59 INFO:root:[step 591999] mlm_loss=1.62918 mlm_acc=64.10752 nsp_loss=0.05264 nsp_acc=97.947 throughput=140.0K tks/s lr=0.0000408 time=143.40 INFO:root:[step 592249] mlm_loss=1.53406 mlm_acc=65.17208 nsp_loss=0.05530 nsp_acc=97.922 throughput=136.0K tks/s lr=0.0000408 time=138.73 INFO:root:[step 592499] mlm_loss=1.50312 mlm_acc=66.79524 nsp_loss=0.03721 nsp_acc=98.667 throughput=128.0K tks/s lr=0.0000408 time=114.95 INFO:root:[step 592749] mlm_loss=1.42467 mlm_acc=68.03946 nsp_loss=0.03761 nsp_acc=98.678 throughput=109.0K tks/s lr=0.0000407 time=116.62 INFO:root:[step 592999] mlm_loss=1.56595 mlm_acc=65.36853 nsp_loss=0.06495 nsp_acc=97.422 throughput=140.0K tks/s lr=0.0000407 time=137.50 INFO:root:[step 593249] mlm_loss=1.53852 mlm_acc=66.75920 nsp_loss=0.03656 nsp_acc=98.699 throughput=134.0K tks/s lr=0.0000407 time=116.48 INFO:root:[step 593499] mlm_loss=1.49860 mlm_acc=67.13716 nsp_loss=0.03453 nsp_acc=98.820 throughput=119.0K tks/s lr=0.0000407 time=119.46 INFO:root:[step 593749] mlm_loss=1.61961 mlm_acc=66.32730 nsp_loss=0.02899 nsp_acc=98.981 throughput=141.0K tks/s lr=0.0000406 time=121.76 INFO:root:[step 593999] mlm_loss=1.68049 mlm_acc=64.69055 nsp_loss=0.04923 nsp_acc=98.111 throughput=147.0K tks/s lr=0.0000406 time=156.35 INFO:root:[step 594249] mlm_loss=1.57558 mlm_acc=64.58383 nsp_loss=0.04974 nsp_acc=98.197 throughput=142.0K tks/s lr=0.0000406 time=132.09 INFO:root:[step 594499] mlm_loss=1.71955 mlm_acc=64.22939 nsp_loss=0.04672 nsp_acc=98.223 throughput=140.0K tks/s lr=0.0000406 time=134.33 INFO:root:[step 594749] mlm_loss=1.56495 mlm_acc=66.03610 nsp_loss=0.04008 nsp_acc=98.489 throughput=127.0K tks/s lr=0.0000405 time=124.18 INFO:root:overflow detected. set loss_scale = 256.0 INFO:root:[step 594999] mlm_loss=1.72323 mlm_acc=63.58626 nsp_loss=0.05681 nsp_acc=97.694 throughput=157.0K tks/s lr=0.0000405 time=160.35 INFO:root:[step 594999] Saving checkpoints to /home/ubuntu/ckpt-master/0594999.params, /home/ubuntu/ckpt-master/0594999.states. INFO:root:[step 595249] mlm_loss=1.35259 mlm_acc=67.38814 nsp_loss=0.05517 nsp_acc=98.028 throughput=103.0K tks/s lr=0.0000405 time=135.37 INFO:root:[step 595499] mlm_loss=1.54207 mlm_acc=66.20358 nsp_loss=0.03573 nsp_acc=98.751 throughput=134.0K tks/s lr=0.0000405 time=120.94 INFO:root:[step 595749] mlm_loss=1.61615 mlm_acc=64.55037 nsp_loss=0.05975 nsp_acc=97.717 throughput=140.0K tks/s lr=0.0000404 time=139.05 INFO:root:[step 595999] mlm_loss=1.63367 mlm_acc=65.07897 nsp_loss=0.09266 nsp_acc=96.170 throughput=136.0K tks/s lr=0.0000404 time=136.16 INFO:root:[step 596249] mlm_loss=1.68486 mlm_acc=64.84319 nsp_loss=0.08330 nsp_acc=96.692 throughput=142.0K tks/s lr=0.0000404 time=139.00 INFO:root:[step 596499] mlm_loss=1.65034 mlm_acc=65.34437 nsp_loss=0.03306 nsp_acc=98.786 throughput=138.0K tks/s lr=0.0000404 time=132.76 INFO:root:[step 596749] mlm_loss=1.77255 mlm_acc=61.88267 nsp_loss=0.05767 nsp_acc=97.822 throughput=149.0K tks/s lr=0.0000403 time=154.59 INFO:root:[step 596999] mlm_loss=1.53389 mlm_acc=66.82998 nsp_loss=0.03478 nsp_acc=98.758 throughput=131.0K tks/s lr=0.0000403 time=114.81 INFO:root:[step 597249] mlm_loss=1.47955 mlm_acc=66.48198 nsp_loss=0.05926 nsp_acc=97.761 throughput=121.0K tks/s lr=0.0000403 time=124.25 INFO:root:[step 597499] mlm_loss=1.51411 mlm_acc=65.62829 nsp_loss=0.06255 nsp_acc=97.616 throughput=133.0K tks/s lr=0.0000403 time=119.34 INFO:root:[step 597749] mlm_loss=1.63562 mlm_acc=64.88481 nsp_loss=0.05130 nsp_acc=98.098 throughput=142.0K tks/s lr=0.0000402 time=137.52 INFO:root:[step 597999] mlm_loss=1.45557 mlm_acc=66.59335 nsp_loss=0.04569 nsp_acc=98.308 throughput=121.0K tks/s lr=0.0000402 time=123.19 INFO:root:[step 598249] mlm_loss=1.65659 mlm_acc=64.74722 nsp_loss=0.05078 nsp_acc=98.092 throughput=136.0K tks/s lr=0.0000402 time=137.55 INFO:root:[step 598499] mlm_loss=1.54664 mlm_acc=66.93249 nsp_loss=0.03393 nsp_acc=98.840 throughput=130.0K tks/s lr=0.0000402 time=114.18 INFO:root:[step 598749] mlm_loss=1.50834 mlm_acc=66.93514 nsp_loss=0.04469 nsp_acc=98.367 throughput=119.0K tks/s lr=0.0000401 time=121.14 INFO:root:[step 598999] mlm_loss=1.59289 mlm_acc=66.54508 nsp_loss=0.03001 nsp_acc=98.940 throughput=137.0K tks/s lr=0.0000401 time=121.88 INFO:root:[step 599249] mlm_loss=1.56402 mlm_acc=64.89178 nsp_loss=0.04756 nsp_acc=98.182 throughput=138.0K tks/s lr=0.0000401 time=141.07 INFO:root:[step 599499] mlm_loss=1.55235 mlm_acc=66.39986 nsp_loss=0.03448 nsp_acc=98.766 throughput=129.0K tks/s lr=0.0000401 time=123.22 INFO:root:[step 599749] mlm_loss=1.55176 mlm_acc=65.11871 nsp_loss=0.04315 nsp_acc=98.419 throughput=137.0K tks/s lr=0.0000400 time=139.84 INFO:root:[step 599999] mlm_loss=1.53873 mlm_acc=67.00640 nsp_loss=0.03204 nsp_acc=98.852 throughput=133.0K tks/s lr=0.0000400 time=117.70 INFO:root:[step 599999] Saving checkpoints to /home/ubuntu/ckpt-master/0599999.params, /home/ubuntu/ckpt-master/0599999.states. INFO:root:[step 600249] mlm_loss=1.45160 mlm_acc=68.09866 nsp_loss=0.03677 nsp_acc=98.690 throughput=111.0K tks/s lr=0.0000400 time=126.32 INFO:root:[step 600499] mlm_loss=1.45744 mlm_acc=67.53627 nsp_loss=0.03539 nsp_acc=98.716 throughput=114.0K tks/s lr=0.0000400 time=119.45 INFO:root:[step 600749] mlm_loss=1.42748 mlm_acc=67.71060 nsp_loss=0.04097 nsp_acc=98.535 throughput=115.0K tks/s lr=0.0000399 time=105.37 INFO:root:[step 600999] mlm_loss=1.53596 mlm_acc=66.68106 nsp_loss=0.03418 nsp_acc=98.776 throughput=126.0K tks/s lr=0.0000399 time=125.44 INFO:root:[step 601249] mlm_loss=1.49451 mlm_acc=67.26632 nsp_loss=0.03449 nsp_acc=98.803 throughput=128.0K tks/s lr=0.0000399 time=112.39 INFO:root:[step 601499] mlm_loss=1.35713 mlm_acc=68.95294 nsp_loss=0.04369 nsp_acc=98.494 throughput=124.0K tks/s lr=0.0000399 time=112.17 INFO:root:[step 601749] mlm_loss=1.56171 mlm_acc=66.91657 nsp_loss=0.03475 nsp_acc=98.767 throughput=125.0K tks/s lr=0.0000398 time=126.02 INFO:root:[step 601999] mlm_loss=1.55564 mlm_acc=66.76533 nsp_loss=0.03512 nsp_acc=98.730 throughput=127.0K tks/s lr=0.0000398 time=122.22 INFO:root:[step 602249] mlm_loss=1.55752 mlm_acc=66.14980 nsp_loss=0.03238 nsp_acc=98.835 throughput=134.0K tks/s lr=0.0000398 time=124.19 INFO:root:[step 602499] mlm_loss=1.59166 mlm_acc=65.54883 nsp_loss=0.04672 nsp_acc=98.235 throughput=143.0K tks/s lr=0.0000398 time=138.46 INFO:root:[step 602749] mlm_loss=1.29133 mlm_acc=68.28056 nsp_loss=0.05403 nsp_acc=98.057 throughput=116.0K tks/s lr=0.0000397 time=120.92 INFO:root:[step 602999] mlm_loss=1.51726 mlm_acc=67.42185 nsp_loss=0.03185 nsp_acc=98.869 throughput=131.0K tks/s lr=0.0000397 time=116.10 INFO:root:[step 603249] mlm_loss=1.54745 mlm_acc=66.36625 nsp_loss=0.03375 nsp_acc=98.811 throughput=131.0K tks/s lr=0.0000397 time=128.62 INFO:root:[step 603499] mlm_loss=1.44643 mlm_acc=67.64519 nsp_loss=0.03778 nsp_acc=98.646 throughput=126.0K tks/s lr=0.0000397 time=109.96 INFO:root:[step 603749] mlm_loss=1.52264 mlm_acc=67.13690 nsp_loss=0.03361 nsp_acc=98.824 throughput=121.0K tks/s lr=0.0000396 time=118.17 INFO:root:[step 603999] mlm_loss=1.47710 mlm_acc=67.34142 nsp_loss=0.03636 nsp_acc=98.714 throughput=129.0K tks/s lr=0.0000396 time=113.09 INFO:root:[step 604249] mlm_loss=1.50699 mlm_acc=65.62478 nsp_loss=0.08428 nsp_acc=96.645 throughput=129.0K tks/s lr=0.0000396 time=134.35 INFO:root:[step 604499] mlm_loss=1.56543 mlm_acc=64.38663 nsp_loss=0.05406 nsp_acc=97.896 throughput=137.0K tks/s lr=0.0000396 time=132.08 INFO:root:[step 604749] mlm_loss=1.65523 mlm_acc=65.76013 nsp_loss=0.03237 nsp_acc=98.874 throughput=143.0K tks/s lr=0.0000395 time=135.20 INFO:root:[step 604999] mlm_loss=1.79859 mlm_acc=63.35413 nsp_loss=0.03396 nsp_acc=98.757 throughput=153.0K tks/s lr=0.0000395 time=156.07 INFO:root:[step 604999] Saving checkpoints to /home/ubuntu/ckpt-master/0604999.params, /home/ubuntu/ckpt-master/0604999.states. INFO:root:[step 605249] mlm_loss=1.68982 mlm_acc=65.05876 nsp_loss=0.02836 nsp_acc=98.999 throughput=132.0K tks/s lr=0.0000395 time=155.61 INFO:root:[step 605499] mlm_loss=1.58646 mlm_acc=65.61173 nsp_loss=0.03749 nsp_acc=98.620 throughput=132.0K tks/s lr=0.0000395 time=129.20 INFO:root:[step 605749] mlm_loss=1.80323 mlm_acc=62.89988 nsp_loss=0.04467 nsp_acc=98.229 throughput=157.0K tks/s lr=0.0000394 time=159.67 INFO:root:[step 605999] mlm_loss=1.46414 mlm_acc=67.22153 nsp_loss=0.03639 nsp_acc=98.720 throughput=116.0K tks/s lr=0.0000394 time=119.31 INFO:root:[step 606249] mlm_loss=1.59262 mlm_acc=65.32043 nsp_loss=0.05038 nsp_acc=98.089 throughput=141.0K tks/s lr=0.0000394 time=135.68 INFO:root:[step 606499] mlm_loss=1.72983 mlm_acc=63.05114 nsp_loss=0.07004 nsp_acc=97.224 throughput=149.0K tks/s lr=0.0000394 time=154.93 INFO:root:[step 606749] mlm_loss=1.54091 mlm_acc=66.80023 nsp_loss=0.04013 nsp_acc=98.491 throughput=131.0K tks/s lr=0.0000393 time=127.47 INFO:root:[step 606999] mlm_loss=1.69462 mlm_acc=64.35794 nsp_loss=0.06496 nsp_acc=97.393 throughput=154.0K tks/s lr=0.0000393 time=153.58 INFO:root:[step 607249] mlm_loss=1.72739 mlm_acc=62.14736 nsp_loss=0.04755 nsp_acc=98.264 throughput=147.0K tks/s lr=0.0000393 time=151.32 INFO:root:[step 607499] mlm_loss=1.48443 mlm_acc=67.31195 nsp_loss=0.04353 nsp_acc=98.415 throughput=121.0K tks/s lr=0.0000393 time=121.07 INFO:root:[step 607749] mlm_loss=1.54131 mlm_acc=65.90487 nsp_loss=0.10965 nsp_acc=95.369 throughput=131.0K tks/s lr=0.0000392 time=124.16 INFO:root:[step 607999] mlm_loss=1.54730 mlm_acc=66.78614 nsp_loss=0.03377 nsp_acc=98.729 throughput=124.0K tks/s lr=0.0000392 time=125.23 INFO:root:[step 608249] mlm_loss=1.41404 mlm_acc=68.36597 nsp_loss=0.03734 nsp_acc=98.704 throughput=119.0K tks/s lr=0.0000392 time=109.38 INFO:root:[step 608499] mlm_loss=1.46440 mlm_acc=67.71955 nsp_loss=0.03547 nsp_acc=98.735 throughput=125.0K tks/s lr=0.0000392 time=110.07 INFO:root:[step 608749] mlm_loss=1.69759 mlm_acc=64.34288 nsp_loss=0.04917 nsp_acc=98.092 throughput=147.0K tks/s lr=0.0000391 time=156.90 INFO:root:[step 608999] mlm_loss=1.72705 mlm_acc=63.12567 nsp_loss=0.07317 nsp_acc=97.083 throughput=147.0K tks/s lr=0.0000391 time=157.94 INFO:root:[step 609249] mlm_loss=1.44002 mlm_acc=67.79983 nsp_loss=0.03653 nsp_acc=98.703 throughput=121.0K tks/s lr=0.0000391 time=109.78 INFO:root:[step 609499] mlm_loss=1.52972 mlm_acc=66.74695 nsp_loss=0.03287 nsp_acc=98.821 throughput=127.0K tks/s lr=0.0000391 time=126.14 INFO:root:[step 609749] mlm_loss=1.54115 mlm_acc=64.96438 nsp_loss=0.06462 nsp_acc=97.469 throughput=142.0K tks/s lr=0.0000390 time=124.79 INFO:root:[step 609999] mlm_loss=1.85250 mlm_acc=61.73987 nsp_loss=0.07596 nsp_acc=96.923 throughput=143.0K tks/s lr=0.0000390 time=162.53 INFO:root:[step 609999] Saving checkpoints to /home/ubuntu/ckpt-master/0609999.params, /home/ubuntu/ckpt-master/0609999.states. INFO:root:[step 610249] mlm_loss=1.56745 mlm_acc=66.53756 nsp_loss=0.03298 nsp_acc=98.823 throughput=121.0K tks/s lr=0.0000390 time=132.23 INFO:root:[step 610499] mlm_loss=1.74974 mlm_acc=63.66291 nsp_loss=0.04300 nsp_acc=98.369 throughput=143.0K tks/s lr=0.0000390 time=159.79 INFO:root:[step 610749] mlm_loss=1.42090 mlm_acc=66.54645 nsp_loss=0.04323 nsp_acc=98.422 throughput=131.0K tks/s lr=0.0000389 time=113.48 INFO:root:[step 610999] mlm_loss=1.61140 mlm_acc=64.82488 nsp_loss=0.04879 nsp_acc=98.136 throughput=138.0K tks/s lr=0.0000389 time=136.15 INFO:root:[step 611249] mlm_loss=1.51281 mlm_acc=65.79608 nsp_loss=0.05345 nsp_acc=97.970 throughput=135.0K tks/s lr=0.0000389 time=123.62 INFO:root:[step 611499] mlm_loss=1.68178 mlm_acc=64.72885 nsp_loss=0.05930 nsp_acc=97.657 throughput=152.0K tks/s lr=0.0000389 time=164.80 INFO:root:[step 611749] mlm_loss=1.53272 mlm_acc=66.36166 nsp_loss=0.05790 nsp_acc=97.695 throughput=128.0K tks/s lr=0.0000388 time=132.14 INFO:root:[step 611999] mlm_loss=1.43884 mlm_acc=67.85888 nsp_loss=0.03787 nsp_acc=98.645 throughput=121.0K tks/s lr=0.0000388 time=109.98 INFO:root:[step 612249] mlm_loss=1.44914 mlm_acc=67.77405 nsp_loss=0.03323 nsp_acc=98.826 throughput=127.0K tks/s lr=0.0000388 time=112.46 INFO:root:[step 612499] mlm_loss=1.50808 mlm_acc=67.37691 nsp_loss=0.02965 nsp_acc=98.939 throughput=126.0K tks/s lr=0.0000388 time=125.25 INFO:root:[step 612749] mlm_loss=1.42417 mlm_acc=67.99532 nsp_loss=0.03320 nsp_acc=98.839 throughput=122.0K tks/s lr=0.0000387 time=106.98 INFO:root:[step 612999] mlm_loss=1.42225 mlm_acc=68.21937 nsp_loss=0.02976 nsp_acc=98.936 throughput=120.0K tks/s lr=0.0000387 time=121.74 INFO:root:[step 613249] mlm_loss=1.36037 mlm_acc=68.36649 nsp_loss=0.03422 nsp_acc=98.784 throughput=118.0K tks/s lr=0.0000387 time=110.51 INFO:root:[step 613499] mlm_loss=1.34902 mlm_acc=68.70084 nsp_loss=0.03388 nsp_acc=98.873 throughput=121.0K tks/s lr=0.0000387 time=106.47 INFO:root:[step 613749] mlm_loss=1.32891 mlm_acc=68.95636 nsp_loss=0.03292 nsp_acc=98.829 throughput=113.0K tks/s lr=0.0000386 time=112.39 INFO:root:[step 613999] mlm_loss=1.47770 mlm_acc=66.53753 nsp_loss=0.06210 nsp_acc=97.632 throughput=143.0K tks/s lr=0.0000386 time=131.94 INFO:root:[step 614249] mlm_loss=1.63303 mlm_acc=65.78259 nsp_loss=0.02504 nsp_acc=99.091 throughput=141.0K tks/s lr=0.0000386 time=136.80 INFO:root:[step 614499] mlm_loss=1.67551 mlm_acc=65.29943 nsp_loss=0.01966 nsp_acc=99.308 throughput=139.0K tks/s lr=0.0000386 time=154.82 INFO:root:[step 614749] mlm_loss=1.41253 mlm_acc=67.78261 nsp_loss=0.03269 nsp_acc=98.883 throughput=126.0K tks/s lr=0.0000385 time=109.77 INFO:root:[step 614999] mlm_loss=1.49655 mlm_acc=66.43419 nsp_loss=0.05376 nsp_acc=97.917 throughput=137.0K tks/s lr=0.0000385 time=138.46 INFO:root:[step 614999] Saving checkpoints to /home/ubuntu/ckpt-master/0614999.params, /home/ubuntu/ckpt-master/0614999.states. INFO:root:[step 615249] mlm_loss=1.42501 mlm_acc=67.95353 nsp_loss=0.02986 nsp_acc=98.945 throughput=112.0K tks/s lr=0.0000385 time=126.71 INFO:root:[step 615499] mlm_loss=1.46890 mlm_acc=68.59632 nsp_loss=0.06488 nsp_acc=97.464 throughput=145.0K tks/s lr=0.0000385 time=145.33 INFO:root:[step 615749] mlm_loss=1.45302 mlm_acc=69.09163 nsp_loss=0.03197 nsp_acc=98.877 throughput=136.0K tks/s lr=0.0000384 time=136.43 INFO:root:[step 615999] mlm_loss=1.51676 mlm_acc=67.15045 nsp_loss=0.02806 nsp_acc=98.996 throughput=136.0K tks/s lr=0.0000384 time=114.81 INFO:root:[step 616249] mlm_loss=1.51623 mlm_acc=67.09682 nsp_loss=0.02846 nsp_acc=99.009 throughput=125.0K tks/s lr=0.0000384 time=126.01 INFO:root:[step 616499] mlm_loss=1.54940 mlm_acc=66.63359 nsp_loss=0.03554 nsp_acc=98.753 throughput=131.0K tks/s lr=0.0000384 time=126.03 INFO:root:[step 616749] mlm_loss=1.74063 mlm_acc=63.03528 nsp_loss=0.07818 nsp_acc=96.773 throughput=149.0K tks/s lr=0.0000383 time=154.32 INFO:root:[step 616999] mlm_loss=1.41352 mlm_acc=67.60705 nsp_loss=0.04299 nsp_acc=98.402 throughput=123.0K tks/s lr=0.0000383 time=112.02 INFO:root:[step 617249] mlm_loss=1.49796 mlm_acc=66.83592 nsp_loss=0.03440 nsp_acc=98.694 throughput=123.0K tks/s lr=0.0000383 time=125.04 INFO:root:[step 617499] mlm_loss=1.50400 mlm_acc=67.17997 nsp_loss=0.02977 nsp_acc=98.965 throughput=132.0K tks/s lr=0.0000383 time=114.47 INFO:root:[step 617749] mlm_loss=1.68333 mlm_acc=64.27988 nsp_loss=0.06032 nsp_acc=97.612 throughput=139.0K tks/s lr=0.0000382 time=152.35 INFO:root:[step 617999] mlm_loss=1.56025 mlm_acc=65.46806 nsp_loss=0.04821 nsp_acc=98.231 throughput=141.0K tks/s lr=0.0000382 time=121.79 INFO:root:[step 618249] mlm_loss=1.59077 mlm_acc=66.12516 nsp_loss=0.02934 nsp_acc=98.943 throughput=134.0K tks/s lr=0.0000382 time=129.89 INFO:root:[step 618499] mlm_loss=1.44044 mlm_acc=67.91663 nsp_loss=0.03198 nsp_acc=98.857 throughput=122.0K tks/s lr=0.0000382 time=109.43 INFO:root:[step 618749] mlm_loss=1.46491 mlm_acc=67.58435 nsp_loss=0.03223 nsp_acc=98.854 throughput=120.0K tks/s lr=0.0000381 time=120.40 INFO:root:[step 618999] mlm_loss=1.62461 mlm_acc=65.83279 nsp_loss=0.02963 nsp_acc=98.925 throughput=143.0K tks/s lr=0.0000381 time=136.52 INFO:root:[step 619249] mlm_loss=1.45452 mlm_acc=66.69702 nsp_loss=0.05057 nsp_acc=98.083 throughput=136.0K tks/s lr=0.0000381 time=126.73 INFO:root:[step 619499] mlm_loss=1.31120 mlm_acc=72.30486 nsp_loss=0.03983 nsp_acc=98.673 throughput=144.0K tks/s lr=0.0000381 time=141.83 INFO:root:[step 619749] mlm_loss=1.55871 mlm_acc=65.93369 nsp_loss=0.05136 nsp_acc=98.094 throughput=144.0K tks/s lr=0.0000380 time=142.07 INFO:root:[step 619999] mlm_loss=1.70724 mlm_acc=63.54320 nsp_loss=0.02993 nsp_acc=98.889 throughput=143.0K tks/s lr=0.0000380 time=158.56 INFO:root:[step 619999] Saving checkpoints to /home/ubuntu/ckpt-master/0619999.params, /home/ubuntu/ckpt-master/0619999.states. INFO:root:[step 620249] mlm_loss=1.49955 mlm_acc=65.16765 nsp_loss=0.03839 nsp_acc=98.601 throughput=122.0K tks/s lr=0.0000380 time=130.90 INFO:root:[step 620499] mlm_loss=1.61901 mlm_acc=64.00679 nsp_loss=0.04427 nsp_acc=98.293 throughput=141.0K tks/s lr=0.0000380 time=143.37 INFO:root:[step 620749] mlm_loss=1.55676 mlm_acc=65.16808 nsp_loss=0.08710 nsp_acc=96.245 throughput=141.0K tks/s lr=0.0000379 time=136.59 INFO:root:[step 620999] mlm_loss=1.31644 mlm_acc=71.28073 nsp_loss=0.06057 nsp_acc=97.772 throughput=153.0K tks/s lr=0.0000379 time=152.80 INFO:root:[step 621249] mlm_loss=1.71321 mlm_acc=64.25120 nsp_loss=0.03711 nsp_acc=98.595 throughput=155.0K tks/s lr=0.0000379 time=153.41 INFO:root:[step 621499] mlm_loss=1.82314 mlm_acc=62.83602 nsp_loss=0.05279 nsp_acc=97.963 throughput=137.0K tks/s lr=0.0000379 time=135.77 INFO:root:[step 621749] mlm_loss=1.65053 mlm_acc=64.99660 nsp_loss=0.03867 nsp_acc=98.625 throughput=145.0K tks/s lr=0.0000378 time=137.92 INFO:root:[step 621999] mlm_loss=1.48447 mlm_acc=66.22474 nsp_loss=0.03900 nsp_acc=98.591 throughput=122.0K tks/s lr=0.0000378 time=127.49 INFO:root:[step 622249] mlm_loss=1.44341 mlm_acc=67.29229 nsp_loss=0.03396 nsp_acc=98.813 throughput=132.0K tks/s lr=0.0000378 time=111.41 INFO:root:[step 622499] mlm_loss=1.53867 mlm_acc=66.80555 nsp_loss=0.02839 nsp_acc=98.990 throughput=131.0K tks/s lr=0.0000378 time=132.05 INFO:root:[step 622749] mlm_loss=1.48699 mlm_acc=66.26800 nsp_loss=0.05354 nsp_acc=97.965 throughput=139.0K tks/s lr=0.0000377 time=139.66 INFO:root:[step 622999] mlm_loss=1.47825 mlm_acc=67.16277 nsp_loss=0.03140 nsp_acc=98.904 throughput=132.0K tks/s lr=0.0000377 time=115.90 INFO:root:[step 623249] mlm_loss=1.53151 mlm_acc=66.60926 nsp_loss=0.03079 nsp_acc=98.948 throughput=131.0K tks/s lr=0.0000377 time=123.56 INFO:root:[step 623499] mlm_loss=1.60187 mlm_acc=66.01798 nsp_loss=0.02770 nsp_acc=99.026 throughput=136.0K tks/s lr=0.0000377 time=130.46 INFO:root:[step 623749] mlm_loss=1.52180 mlm_acc=66.78518 nsp_loss=0.03128 nsp_acc=98.874 throughput=136.0K tks/s lr=0.0000376 time=119.25 INFO:root:[step 623999] mlm_loss=1.59148 mlm_acc=64.50495 nsp_loss=0.03795 nsp_acc=98.578 throughput=140.0K tks/s lr=0.0000376 time=140.28 INFO:root:[step 624249] mlm_loss=1.77617 mlm_acc=62.65384 nsp_loss=0.04075 nsp_acc=98.467 throughput=153.0K tks/s lr=0.0000376 time=165.15 INFO:root:[step 624499] mlm_loss=1.41570 mlm_acc=67.35632 nsp_loss=0.03477 nsp_acc=98.781 throughput=132.0K tks/s lr=0.0000376 time=119.63 INFO:root:[step 624749] mlm_loss=1.56146 mlm_acc=65.28629 nsp_loss=0.03593 nsp_acc=98.725 throughput=132.0K tks/s lr=0.0000375 time=129.44 INFO:root:[step 624999] mlm_loss=1.81160 mlm_acc=62.49698 nsp_loss=0.05857 nsp_acc=97.659 throughput=154.0K tks/s lr=0.0000375 time=173.31 INFO:root:[step 624999] Saving checkpoints to /home/ubuntu/ckpt-master/0624999.params, /home/ubuntu/ckpt-master/0624999.states. INFO:root:[step 625249] mlm_loss=1.67062 mlm_acc=65.46784 nsp_loss=0.03024 nsp_acc=98.811 throughput=135.0K tks/s lr=0.0000375 time=158.94 INFO:root:[step 625499] mlm_loss=1.32321 mlm_acc=67.54173 nsp_loss=0.06039 nsp_acc=97.712 throughput=121.0K tks/s lr=0.0000375 time=119.05 INFO:root:[step 625749] mlm_loss=1.38974 mlm_acc=68.03113 nsp_loss=0.03548 nsp_acc=98.768 throughput=121.0K tks/s lr=0.0000374 time=107.00 INFO:root:[step 625999] mlm_loss=1.43778 mlm_acc=67.68870 nsp_loss=0.03392 nsp_acc=98.828 throughput=116.0K tks/s lr=0.0000374 time=118.07 INFO:root:[step 626249] mlm_loss=1.62090 mlm_acc=64.48059 nsp_loss=0.04946 nsp_acc=98.119 throughput=147.0K tks/s lr=0.0000374 time=143.98 INFO:root:[step 626499] mlm_loss=1.63824 mlm_acc=64.62318 nsp_loss=0.06939 nsp_acc=97.271 throughput=149.0K tks/s lr=0.0000374 time=151.07 INFO:root:[step 626749] mlm_loss=1.58991 mlm_acc=65.80507 nsp_loss=0.04098 nsp_acc=98.394 throughput=142.0K tks/s lr=0.0000373 time=134.81 INFO:root:[step 626999] mlm_loss=1.74143 mlm_acc=63.13543 nsp_loss=0.07335 nsp_acc=97.079 throughput=157.0K tks/s lr=0.0000373 time=179.98 INFO:root:[step 627249] mlm_loss=1.43658 mlm_acc=68.19810 nsp_loss=0.03127 nsp_acc=98.868 throughput=122.0K tks/s lr=0.0000373 time=110.17 INFO:root:[step 627499] mlm_loss=1.52952 mlm_acc=65.70349 nsp_loss=0.04476 nsp_acc=98.279 throughput=139.0K tks/s lr=0.0000373 time=138.13 INFO:root:[step 627749] mlm_loss=1.48504 mlm_acc=66.20395 nsp_loss=0.04316 nsp_acc=98.435 throughput=143.0K tks/s lr=0.0000372 time=138.07 INFO:root:[step 627999] mlm_loss=1.65502 mlm_acc=65.04308 nsp_loss=0.03870 nsp_acc=98.597 throughput=148.0K tks/s lr=0.0000372 time=147.70 INFO:root:[step 628249] mlm_loss=1.49075 mlm_acc=66.71902 nsp_loss=0.02512 nsp_acc=99.141 throughput=136.0K tks/s lr=0.0000372 time=119.57 INFO:root:[step 628499] mlm_loss=1.70514 mlm_acc=63.82595 nsp_loss=0.02442 nsp_acc=99.121 throughput=145.0K tks/s lr=0.0000372 time=155.59 INFO:root:[step 628749] mlm_loss=1.60387 mlm_acc=65.26270 nsp_loss=0.08214 nsp_acc=96.502 throughput=141.0K tks/s lr=0.0000371 time=140.52 INFO:root:[step 628999] mlm_loss=1.54680 mlm_acc=66.40796 nsp_loss=0.03072 nsp_acc=98.933 throughput=136.0K tks/s lr=0.0000371 time=122.78 INFO:root:[step 629249] mlm_loss=1.68311 mlm_acc=63.74152 nsp_loss=0.03160 nsp_acc=98.877 throughput=146.0K tks/s lr=0.0000371 time=144.23 INFO:root:[step 629499] mlm_loss=1.27744 mlm_acc=68.13827 nsp_loss=0.05183 nsp_acc=98.100 throughput=119.0K tks/s lr=0.0000371 time=120.83 INFO:root:[step 629749] mlm_loss=1.49657 mlm_acc=66.35397 nsp_loss=0.04444 nsp_acc=98.330 throughput=139.0K tks/s lr=0.0000370 time=126.67 INFO:root:[step 629999] mlm_loss=1.38877 mlm_acc=68.32062 nsp_loss=0.03463 nsp_acc=98.750 throughput=110.0K tks/s lr=0.0000370 time=114.85 INFO:root:[step 629999] Saving checkpoints to /home/ubuntu/ckpt-master/0629999.params, /home/ubuntu/ckpt-master/0629999.states. INFO:root:[step 630249] mlm_loss=1.52666 mlm_acc=66.05024 nsp_loss=0.03058 nsp_acc=98.908 throughput=120.0K tks/s lr=0.0000370 time=141.53 INFO:root:[step 630499] mlm_loss=1.64356 mlm_acc=65.89349 nsp_loss=0.02570 nsp_acc=99.102 throughput=144.0K tks/s lr=0.0000370 time=130.10 INFO:root:[step 630749] mlm_loss=1.75815 mlm_acc=63.72802 nsp_loss=0.04903 nsp_acc=98.076 throughput=146.0K tks/s lr=0.0000369 time=156.58 INFO:root:[step 630999] mlm_loss=1.62230 mlm_acc=65.45759 nsp_loss=0.03253 nsp_acc=98.785 throughput=150.0K tks/s lr=0.0000369 time=151.38 INFO:root:[step 631249] mlm_loss=1.41200 mlm_acc=67.99070 nsp_loss=0.03275 nsp_acc=98.890 throughput=124.0K tks/s lr=0.0000369 time=111.81 INFO:root:[step 631499] mlm_loss=1.35596 mlm_acc=68.62751 nsp_loss=0.03622 nsp_acc=98.773 throughput=111.0K tks/s lr=0.0000369 time=115.28 INFO:root:[step 631749] mlm_loss=1.53742 mlm_acc=66.71474 nsp_loss=0.02912 nsp_acc=98.954 throughput=131.0K tks/s lr=0.0000368 time=116.11 INFO:root:[step 631999] mlm_loss=1.66269 mlm_acc=65.74051 nsp_loss=0.02283 nsp_acc=99.190 throughput=143.0K tks/s lr=0.0000368 time=140.26 INFO:root:[step 632249] mlm_loss=1.60132 mlm_acc=65.41987 nsp_loss=0.07608 nsp_acc=96.981 throughput=133.0K tks/s lr=0.0000368 time=136.16 INFO:root:[step 632499] mlm_loss=1.51449 mlm_acc=66.45107 nsp_loss=0.02677 nsp_acc=99.061 throughput=133.0K tks/s lr=0.0000368 time=132.69 INFO:root:[step 632749] mlm_loss=1.61651 mlm_acc=63.63663 nsp_loss=0.03289 nsp_acc=98.805 throughput=139.0K tks/s lr=0.0000367 time=137.43 INFO:root:[step 632999] mlm_loss=1.56515 mlm_acc=66.88481 nsp_loss=0.02526 nsp_acc=99.109 throughput=137.0K tks/s lr=0.0000367 time=117.86 INFO:root:[step 633249] mlm_loss=1.41283 mlm_acc=68.05068 nsp_loss=0.03223 nsp_acc=98.860 throughput=117.0K tks/s lr=0.0000367 time=122.33 INFO:root:[step 633499] mlm_loss=1.41799 mlm_acc=68.05260 nsp_loss=0.03317 nsp_acc=98.786 throughput=125.0K tks/s lr=0.0000367 time=108.48 INFO:root:[step 633749] mlm_loss=1.44531 mlm_acc=67.84432 nsp_loss=0.03160 nsp_acc=98.920 throughput=126.0K tks/s lr=0.0000366 time=113.52 INFO:root:[step 633999] mlm_loss=1.52469 mlm_acc=67.03747 nsp_loss=0.03128 nsp_acc=98.905 throughput=126.0K tks/s lr=0.0000366 time=125.58 INFO:root:[step 634249] mlm_loss=1.48687 mlm_acc=67.80797 nsp_loss=0.03322 nsp_acc=98.808 throughput=127.0K tks/s lr=0.0000366 time=114.24 INFO:root:[step 634499] mlm_loss=1.54494 mlm_acc=67.31682 nsp_loss=0.02485 nsp_acc=99.134 throughput=131.0K tks/s lr=0.0000366 time=127.64 INFO:root:[step 634749] mlm_loss=1.58993 mlm_acc=66.17461 nsp_loss=0.03748 nsp_acc=98.644 throughput=135.0K tks/s lr=0.0000365 time=133.77 INFO:root:[step 634999] mlm_loss=1.56704 mlm_acc=65.67485 nsp_loss=0.04380 nsp_acc=98.330 throughput=137.0K tks/s lr=0.0000365 time=143.20 INFO:root:[step 634999] Saving checkpoints to /home/ubuntu/ckpt-master/0634999.params, /home/ubuntu/ckpt-master/0634999.states. INFO:root:[step 635249] mlm_loss=1.32891 mlm_acc=68.69655 nsp_loss=0.03767 nsp_acc=98.674 throughput=103.0K tks/s lr=0.0000365 time=120.99 INFO:root:[step 635499] mlm_loss=1.41521 mlm_acc=67.93276 nsp_loss=0.02916 nsp_acc=99.002 throughput=127.0K tks/s lr=0.0000365 time=110.55 INFO:root:[step 635749] mlm_loss=1.70796 mlm_acc=64.57609 nsp_loss=0.02907 nsp_acc=98.938 throughput=146.0K tks/s lr=0.0000364 time=154.68 INFO:root:[step 635999] mlm_loss=1.47272 mlm_acc=66.24425 nsp_loss=0.04831 nsp_acc=98.254 throughput=131.0K tks/s lr=0.0000364 time=131.99 INFO:root:[step 636249] mlm_loss=1.52001 mlm_acc=66.69347 nsp_loss=0.02768 nsp_acc=99.015 throughput=134.0K tks/s lr=0.0000364 time=123.47 INFO:root:[step 636499] mlm_loss=1.54936 mlm_acc=66.53897 nsp_loss=0.03420 nsp_acc=98.776 throughput=132.0K tks/s lr=0.0000364 time=127.85 INFO:root:[step 636749] mlm_loss=1.49565 mlm_acc=65.74782 nsp_loss=0.04202 nsp_acc=98.448 throughput=131.0K tks/s lr=0.0000363 time=120.18 INFO:root:[step 636999] mlm_loss=1.60661 mlm_acc=63.84923 nsp_loss=0.04549 nsp_acc=98.314 throughput=137.0K tks/s lr=0.0000363 time=137.11 INFO:root:[step 637249] mlm_loss=1.41263 mlm_acc=69.39229 nsp_loss=0.03824 nsp_acc=98.642 throughput=127.0K tks/s lr=0.0000363 time=122.36 INFO:root:[step 637499] mlm_loss=1.26983 mlm_acc=72.83024 nsp_loss=0.04354 nsp_acc=98.474 throughput=137.0K tks/s lr=0.0000363 time=120.95 INFO:root:[step 637749] mlm_loss=1.64209 mlm_acc=64.74184 nsp_loss=0.03469 nsp_acc=98.724 throughput=140.0K tks/s lr=0.0000362 time=134.25 INFO:root:[step 637999] mlm_loss=1.38584 mlm_acc=67.34497 nsp_loss=0.04165 nsp_acc=98.534 throughput=129.0K tks/s lr=0.0000362 time=126.24 INFO:root:[step 638249] mlm_loss=1.72643 mlm_acc=63.16274 nsp_loss=0.04430 nsp_acc=98.321 throughput=147.0K tks/s lr=0.0000362 time=148.59 INFO:root:[step 638499] mlm_loss=1.58502 mlm_acc=64.50201 nsp_loss=0.04588 nsp_acc=98.265 throughput=150.0K tks/s lr=0.0000362 time=148.77 INFO:root:[step 638749] mlm_loss=1.46861 mlm_acc=66.86888 nsp_loss=0.03720 nsp_acc=98.638 throughput=128.0K tks/s lr=0.0000361 time=128.29 INFO:root:[step 638999] mlm_loss=1.64949 mlm_acc=65.70123 nsp_loss=0.02419 nsp_acc=99.108 throughput=139.0K tks/s lr=0.0000361 time=139.44 INFO:root:[step 639249] mlm_loss=1.50759 mlm_acc=66.57107 nsp_loss=0.03083 nsp_acc=98.981 throughput=137.0K tks/s lr=0.0000361 time=116.99 INFO:root:[step 639499] mlm_loss=1.49474 mlm_acc=67.03127 nsp_loss=0.03387 nsp_acc=98.779 throughput=119.0K tks/s lr=0.0000361 time=122.78 INFO:root:[step 639749] mlm_loss=1.49387 mlm_acc=67.10397 nsp_loss=0.03601 nsp_acc=98.690 throughput=129.0K tks/s lr=0.0000360 time=113.84 INFO:root:[step 639999] mlm_loss=1.62494 mlm_acc=65.91418 nsp_loss=0.02539 nsp_acc=99.091 throughput=141.0K tks/s lr=0.0000360 time=135.78 INFO:root:[step 639999] Saving checkpoints to /home/ubuntu/ckpt-master/0639999.params, /home/ubuntu/ckpt-master/0639999.states. INFO:root:[step 640249] mlm_loss=1.41535 mlm_acc=67.67690 nsp_loss=0.03615 nsp_acc=98.737 throughput=102.0K tks/s lr=0.0000360 time=135.51 INFO:root:[step 640499] mlm_loss=1.27832 mlm_acc=68.69300 nsp_loss=0.04752 nsp_acc=98.319 throughput=110.0K tks/s lr=0.0000360 time=105.86 INFO:root:[step 640749] mlm_loss=1.41384 mlm_acc=67.72143 nsp_loss=0.04321 nsp_acc=98.360 throughput=118.0K tks/s lr=0.0000359 time=108.08 INFO:root:[step 640999] mlm_loss=1.59563 mlm_acc=66.32564 nsp_loss=0.02571 nsp_acc=99.089 throughput=138.0K tks/s lr=0.0000359 time=134.79 INFO:root:[step 641249] mlm_loss=1.70322 mlm_acc=64.16566 nsp_loss=0.03369 nsp_acc=98.726 throughput=145.0K tks/s lr=0.0000359 time=143.48 INFO:root:[step 641499] mlm_loss=1.59949 mlm_acc=65.63230 nsp_loss=0.08771 nsp_acc=96.306 throughput=132.0K tks/s lr=0.0000359 time=137.56 INFO:root:[step 641749] mlm_loss=1.41432 mlm_acc=66.04008 nsp_loss=0.06569 nsp_acc=97.450 throughput=134.0K tks/s lr=0.0000358 time=116.03 INFO:root:[step 641999] mlm_loss=1.83415 mlm_acc=62.08904 nsp_loss=0.06483 nsp_acc=97.371 throughput=155.0K tks/s lr=0.0000358 time=170.15 INFO:root:[step 642249] mlm_loss=1.48171 mlm_acc=65.74203 nsp_loss=0.05651 nsp_acc=97.831 throughput=136.0K tks/s lr=0.0000358 time=126.55 INFO:root:[step 642499] mlm_loss=1.63077 mlm_acc=65.98077 nsp_loss=0.02668 nsp_acc=99.037 throughput=136.0K tks/s lr=0.0000358 time=135.76 INFO:root:[step 642749] mlm_loss=1.62486 mlm_acc=65.59530 nsp_loss=0.05943 nsp_acc=97.535 throughput=146.0K tks/s lr=0.0000357 time=155.36 INFO:root:[step 642999] mlm_loss=1.45931 mlm_acc=67.21719 nsp_loss=0.04168 nsp_acc=98.545 throughput=135.0K tks/s lr=0.0000357 time=121.71 INFO:root:[step 643249] mlm_loss=1.36087 mlm_acc=68.76466 nsp_loss=0.03963 nsp_acc=98.617 throughput=120.0K tks/s lr=0.0000357 time=108.57 INFO:root:[step 643499] mlm_loss=1.65984 mlm_acc=65.72666 nsp_loss=0.02479 nsp_acc=99.123 throughput=142.0K tks/s lr=0.0000357 time=137.30 INFO:root:[step 643749] mlm_loss=1.86384 mlm_acc=61.92238 nsp_loss=0.07658 nsp_acc=96.867 throughput=145.0K tks/s lr=0.0000356 time=160.67 INFO:root:[step 643999] mlm_loss=1.72805 mlm_acc=63.89847 nsp_loss=0.08440 nsp_acc=96.645 throughput=146.0K tks/s lr=0.0000356 time=153.17 INFO:root:[step 644249] mlm_loss=1.38841 mlm_acc=68.06578 nsp_loss=0.03626 nsp_acc=98.740 throughput=118.0K tks/s lr=0.0000356 time=107.11 INFO:root:[step 644499] mlm_loss=1.40557 mlm_acc=68.29517 nsp_loss=0.03387 nsp_acc=98.818 throughput=117.0K tks/s lr=0.0000356 time=108.10 INFO:root:[step 644749] mlm_loss=1.65470 mlm_acc=63.89815 nsp_loss=0.04808 nsp_acc=98.171 throughput=136.0K tks/s lr=0.0000355 time=134.98 INFO:root:[step 644999] mlm_loss=1.41661 mlm_acc=68.02228 nsp_loss=0.03640 nsp_acc=98.702 throughput=128.0K tks/s lr=0.0000355 time=110.75 INFO:root:[step 644999] Saving checkpoints to /home/ubuntu/ckpt-master/0644999.params, /home/ubuntu/ckpt-master/0644999.states. INFO:root:[step 645249] mlm_loss=1.48208 mlm_acc=67.51958 nsp_loss=0.03165 nsp_acc=98.869 throughput=113.0K tks/s lr=0.0000355 time=135.73 INFO:root:[step 645499] mlm_loss=1.70286 mlm_acc=64.84374 nsp_loss=0.03626 nsp_acc=98.636 throughput=147.0K tks/s lr=0.0000355 time=144.91 INFO:root:[step 645749] mlm_loss=1.54284 mlm_acc=66.18315 nsp_loss=0.03796 nsp_acc=98.644 throughput=124.0K tks/s lr=0.0000354 time=128.29 INFO:root:[step 645999] mlm_loss=1.40591 mlm_acc=68.17518 nsp_loss=0.03079 nsp_acc=98.927 throughput=121.0K tks/s lr=0.0000354 time=110.63 INFO:root:[step 646249] mlm_loss=1.63908 mlm_acc=63.82588 nsp_loss=0.04611 nsp_acc=98.217 throughput=151.0K tks/s lr=0.0000354 time=146.81 INFO:root:[step 646499] mlm_loss=1.73744 mlm_acc=62.98634 nsp_loss=0.05336 nsp_acc=97.972 throughput=151.0K tks/s lr=0.0000354 time=172.55 INFO:root:[step 646749] mlm_loss=1.49361 mlm_acc=65.83537 nsp_loss=0.04474 nsp_acc=98.339 throughput=139.0K tks/s lr=0.0000353 time=138.96 INFO:root:[step 646999] mlm_loss=1.45009 mlm_acc=66.36256 nsp_loss=0.04873 nsp_acc=98.138 throughput=128.0K tks/s lr=0.0000353 time=115.60 INFO:root:[step 647249] mlm_loss=1.60015 mlm_acc=65.19438 nsp_loss=0.03794 nsp_acc=98.583 throughput=129.0K tks/s lr=0.0000353 time=128.56 INFO:root:[step 647499] mlm_loss=1.59289 mlm_acc=66.62438 nsp_loss=0.02592 nsp_acc=99.131 throughput=141.0K tks/s lr=0.0000353 time=122.89 INFO:root:[step 647749] mlm_loss=1.45391 mlm_acc=67.35185 nsp_loss=0.03350 nsp_acc=98.813 throughput=123.0K tks/s lr=0.0000352 time=120.18 INFO:root:[step 647999] mlm_loss=1.77394 mlm_acc=63.19345 nsp_loss=0.02531 nsp_acc=99.099 throughput=157.0K tks/s lr=0.0000352 time=157.98 INFO:root:[step 648249] mlm_loss=1.46465 mlm_acc=66.93386 nsp_loss=0.03526 nsp_acc=98.721 throughput=116.0K tks/s lr=0.0000352 time=122.64 INFO:root:[step 648499] mlm_loss=1.36633 mlm_acc=68.29460 nsp_loss=0.04116 nsp_acc=98.577 throughput=119.0K tks/s lr=0.0000352 time=106.32 INFO:root:[step 648749] mlm_loss=1.34632 mlm_acc=68.76510 nsp_loss=0.03417 nsp_acc=98.832 throughput=118.0K tks/s lr=0.0000351 time=107.41 INFO:root:[step 648999] mlm_loss=1.58454 mlm_acc=66.40109 nsp_loss=0.02801 nsp_acc=98.996 throughput=132.0K tks/s lr=0.0000351 time=129.71 INFO:root:[step 649249] mlm_loss=1.42613 mlm_acc=67.97467 nsp_loss=0.03114 nsp_acc=98.901 throughput=124.0K tks/s lr=0.0000351 time=111.88 INFO:root:[step 649499] mlm_loss=1.36998 mlm_acc=68.26488 nsp_loss=0.04197 nsp_acc=98.468 throughput=107.0K tks/s lr=0.0000351 time=114.63 INFO:root:[step 649749] mlm_loss=1.36246 mlm_acc=68.20187 nsp_loss=0.03590 nsp_acc=98.714 throughput=123.0K tks/s lr=0.0000350 time=107.42 INFO:root:[step 649999] mlm_loss=1.47896 mlm_acc=67.38013 nsp_loss=0.03064 nsp_acc=98.931 throughput=129.0K tks/s lr=0.0000350 time=115.72 INFO:root:[step 649999] Saving checkpoints to /home/ubuntu/ckpt-master/0649999.params, /home/ubuntu/ckpt-master/0649999.states. INFO:root:[step 650249] mlm_loss=1.43434 mlm_acc=66.99736 nsp_loss=0.04822 nsp_acc=98.192 throughput=96.0K tks/s lr=0.0000350 time=131.69 INFO:root:[step 650499] mlm_loss=1.69628 mlm_acc=63.57325 nsp_loss=0.05324 nsp_acc=97.964 throughput=131.0K tks/s lr=0.0000350 time=120.16 INFO:root:[step 650749] mlm_loss=1.61766 mlm_acc=65.25500 nsp_loss=0.09788 nsp_acc=95.828 throughput=129.0K tks/s lr=0.0000349 time=130.33 INFO:root:[step 650999] mlm_loss=1.54451 mlm_acc=66.96835 nsp_loss=0.02777 nsp_acc=99.004 throughput=141.0K tks/s lr=0.0000349 time=133.64 INFO:root:[step 651249] mlm_loss=1.62664 mlm_acc=65.92398 nsp_loss=0.02639 nsp_acc=99.042 throughput=138.0K tks/s lr=0.0000349 time=136.35 INFO:root:[step 651499] mlm_loss=1.62114 mlm_acc=66.01300 nsp_loss=0.02835 nsp_acc=98.987 throughput=137.0K tks/s lr=0.0000349 time=136.09 INFO:root:[step 651749] mlm_loss=1.52164 mlm_acc=65.43909 nsp_loss=0.03792 nsp_acc=98.582 throughput=146.0K tks/s lr=0.0000348 time=124.26 INFO:root:[step 651999] mlm_loss=1.49019 mlm_acc=65.83624 nsp_loss=0.03354 nsp_acc=98.807 throughput=130.0K tks/s lr=0.0000348 time=129.01 INFO:root:[step 652249] mlm_loss=1.63831 mlm_acc=65.24599 nsp_loss=0.04121 nsp_acc=98.475 throughput=157.0K tks/s lr=0.0000348 time=170.92 INFO:root:[step 652499] mlm_loss=1.57405 mlm_acc=65.72974 nsp_loss=0.04383 nsp_acc=98.320 throughput=147.0K tks/s lr=0.0000348 time=132.96 INFO:root:[step 652749] mlm_loss=1.39599 mlm_acc=68.48491 nsp_loss=0.03251 nsp_acc=98.857 throughput=114.0K tks/s lr=0.0000347 time=116.67 INFO:root:[step 652999] mlm_loss=1.71786 mlm_acc=63.49287 nsp_loss=0.06764 nsp_acc=97.313 throughput=140.0K tks/s lr=0.0000347 time=121.09 INFO:root:[step 653249] mlm_loss=1.36584 mlm_acc=68.06014 nsp_loss=0.04194 nsp_acc=98.470 throughput=106.0K tks/s lr=0.0000347 time=116.84 INFO:root:[step 653499] mlm_loss=1.44484 mlm_acc=67.91184 nsp_loss=0.03414 nsp_acc=98.794 throughput=127.0K tks/s lr=0.0000347 time=110.73 INFO:root:[step 653749] mlm_loss=1.65124 mlm_acc=63.93517 nsp_loss=0.03805 nsp_acc=98.610 throughput=144.0K tks/s lr=0.0000346 time=139.46 INFO:root:[step 653999] mlm_loss=1.67417 mlm_acc=64.77813 nsp_loss=0.04188 nsp_acc=98.364 throughput=151.0K tks/s lr=0.0000346 time=148.18 INFO:root:[step 654249] mlm_loss=1.59030 mlm_acc=65.72373 nsp_loss=0.03315 nsp_acc=98.744 throughput=138.0K tks/s lr=0.0000346 time=135.35 INFO:root:[step 654499] mlm_loss=1.47425 mlm_acc=67.42443 nsp_loss=0.03373 nsp_acc=98.774 throughput=118.0K tks/s lr=0.0000346 time=121.97 INFO:root:[step 654749] mlm_loss=1.40003 mlm_acc=70.00848 nsp_loss=0.03965 nsp_acc=98.597 throughput=141.0K tks/s lr=0.0000345 time=123.90 INFO:root:[step 654999] mlm_loss=1.49871 mlm_acc=67.92951 nsp_loss=0.03550 nsp_acc=98.718 throughput=126.0K tks/s lr=0.0000345 time=127.64 INFO:root:[step 654999] Saving checkpoints to /home/ubuntu/ckpt-master/0654999.params, /home/ubuntu/ckpt-master/0654999.states. INFO:root:[step 655249] mlm_loss=1.40060 mlm_acc=68.30856 nsp_loss=0.03811 nsp_acc=98.624 throughput=108.0K tks/s lr=0.0000345 time=123.40 INFO:root:[step 655499] mlm_loss=1.55648 mlm_acc=65.00647 nsp_loss=0.05210 nsp_acc=98.084 throughput=133.0K tks/s lr=0.0000345 time=135.20 INFO:root:[step 655749] mlm_loss=1.38631 mlm_acc=68.34271 nsp_loss=0.03800 nsp_acc=98.638 throughput=118.0K tks/s lr=0.0000344 time=105.18 INFO:root:[step 655999] mlm_loss=1.54967 mlm_acc=66.55825 nsp_loss=0.02967 nsp_acc=98.941 throughput=134.0K tks/s lr=0.0000344 time=128.09 INFO:root:[step 656249] mlm_loss=1.48016 mlm_acc=67.14101 nsp_loss=0.02957 nsp_acc=98.952 throughput=131.0K tks/s lr=0.0000344 time=116.91 INFO:root:[step 656499] mlm_loss=1.49299 mlm_acc=67.39601 nsp_loss=0.03039 nsp_acc=98.890 throughput=120.0K tks/s lr=0.0000344 time=122.53 INFO:root:[step 656749] mlm_loss=1.43604 mlm_acc=67.77482 nsp_loss=0.03608 nsp_acc=98.684 throughput=125.0K tks/s lr=0.0000343 time=110.90 INFO:root:[step 656999] mlm_loss=1.61021 mlm_acc=64.66929 nsp_loss=0.03809 nsp_acc=98.600 throughput=139.0K tks/s lr=0.0000343 time=136.66 INFO:root:[step 657249] mlm_loss=1.55103 mlm_acc=65.98566 nsp_loss=0.02921 nsp_acc=99.001 throughput=135.0K tks/s lr=0.0000343 time=136.71 INFO:root:[step 657499] mlm_loss=1.58165 mlm_acc=64.85586 nsp_loss=0.03164 nsp_acc=98.877 throughput=147.0K tks/s lr=0.0000343 time=139.82 INFO:root:[step 657749] mlm_loss=1.46732 mlm_acc=67.47786 nsp_loss=0.03086 nsp_acc=98.924 throughput=119.0K tks/s lr=0.0000342 time=122.04 INFO:root:[step 657999] mlm_loss=1.54963 mlm_acc=66.39747 nsp_loss=0.06235 nsp_acc=97.556 throughput=140.0K tks/s lr=0.0000342 time=120.25 INFO:root:[step 658249] mlm_loss=1.29098 mlm_acc=68.12894 nsp_loss=0.05902 nsp_acc=97.878 throughput=116.0K tks/s lr=0.0000342 time=119.71 INFO:root:[step 658499] mlm_loss=1.74607 mlm_acc=63.76594 nsp_loss=0.05400 nsp_acc=97.941 throughput=144.0K tks/s lr=0.0000342 time=129.37 INFO:root:[step 658749] mlm_loss=1.66400 mlm_acc=65.05474 nsp_loss=0.04749 nsp_acc=98.137 throughput=144.0K tks/s lr=0.0000341 time=153.46 INFO:root:[step 658999] mlm_loss=1.56731 mlm_acc=66.60382 nsp_loss=0.02591 nsp_acc=99.067 throughput=143.0K tks/s lr=0.0000341 time=127.98 INFO:root:[step 659249] mlm_loss=1.43511 mlm_acc=67.58529 nsp_loss=0.03323 nsp_acc=98.827 throughput=120.0K tks/s lr=0.0000341 time=120.21 INFO:root:[step 659499] mlm_loss=1.64045 mlm_acc=65.94949 nsp_loss=0.02718 nsp_acc=99.022 throughput=137.0K tks/s lr=0.0000341 time=135.72 INFO:root:[step 659749] mlm_loss=1.63884 mlm_acc=65.68914 nsp_loss=0.04058 nsp_acc=98.434 throughput=142.0K tks/s lr=0.0000340 time=136.37 INFO:root:[step 659999] mlm_loss=1.46682 mlm_acc=66.35924 nsp_loss=0.06461 nsp_acc=97.484 throughput=134.0K tks/s lr=0.0000340 time=122.06 INFO:root:[step 659999] Saving checkpoints to /home/ubuntu/ckpt-master/0659999.params, /home/ubuntu/ckpt-master/0659999.states. INFO:root:[step 660249] mlm_loss=1.38766 mlm_acc=68.43806 nsp_loss=0.03870 nsp_acc=98.609 throughput=103.0K tks/s lr=0.0000340 time=129.33 INFO:root:[step 660499] mlm_loss=1.66081 mlm_acc=65.25836 nsp_loss=0.05706 nsp_acc=97.703 throughput=154.0K tks/s lr=0.0000340 time=157.90 INFO:root:[step 660749] mlm_loss=1.63326 mlm_acc=65.35901 nsp_loss=0.04781 nsp_acc=98.106 throughput=139.0K tks/s lr=0.0000339 time=141.08 INFO:root:[step 660999] mlm_loss=1.48446 mlm_acc=67.38308 nsp_loss=0.03213 nsp_acc=98.838 throughput=134.0K tks/s lr=0.0000339 time=114.23 INFO:root:[step 661249] mlm_loss=1.49594 mlm_acc=67.31201 nsp_loss=0.03371 nsp_acc=98.803 throughput=121.0K tks/s lr=0.0000339 time=123.42 INFO:root:[step 661499] mlm_loss=1.46865 mlm_acc=67.57170 nsp_loss=0.03212 nsp_acc=98.871 throughput=130.0K tks/s lr=0.0000339 time=111.96 INFO:root:[step 661749] mlm_loss=1.41754 mlm_acc=67.92902 nsp_loss=0.03814 nsp_acc=98.636 throughput=111.0K tks/s lr=0.0000338 time=115.50 INFO:root:[step 661999] mlm_loss=1.53082 mlm_acc=66.85635 nsp_loss=0.02933 nsp_acc=98.925 throughput=135.0K tks/s lr=0.0000338 time=118.62 INFO:root:[step 662249] mlm_loss=1.61713 mlm_acc=65.21018 nsp_loss=0.04129 nsp_acc=98.421 throughput=141.0K tks/s lr=0.0000338 time=135.73 INFO:root:[step 662499] mlm_loss=1.54353 mlm_acc=66.02665 nsp_loss=0.04595 nsp_acc=98.232 throughput=127.0K tks/s lr=0.0000338 time=128.22 INFO:root:[step 662749] mlm_loss=1.53354 mlm_acc=66.20147 nsp_loss=0.05019 nsp_acc=98.072 throughput=140.0K tks/s lr=0.0000337 time=142.14 INFO:root:[step 662999] mlm_loss=1.44024 mlm_acc=66.01082 nsp_loss=0.05550 nsp_acc=97.944 throughput=136.0K tks/s lr=0.0000337 time=117.12 INFO:root:[step 663249] mlm_loss=1.66964 mlm_acc=63.07500 nsp_loss=0.06912 nsp_acc=97.287 throughput=129.0K tks/s lr=0.0000337 time=140.09 INFO:root:[step 663499] mlm_loss=1.29572 mlm_acc=68.84138 nsp_loss=0.04095 nsp_acc=98.548 throughput=115.0K tks/s lr=0.0000337 time=104.37 INFO:root:[step 663749] mlm_loss=1.59029 mlm_acc=66.23217 nsp_loss=0.02954 nsp_acc=98.948 throughput=135.0K tks/s lr=0.0000336 time=129.58 INFO:root:[step 663999] mlm_loss=1.59468 mlm_acc=66.20273 nsp_loss=0.03955 nsp_acc=98.559 throughput=134.0K tks/s lr=0.0000336 time=128.23 INFO:root:[step 664249] mlm_loss=1.66465 mlm_acc=64.13454 nsp_loss=0.14040 nsp_acc=93.934 throughput=146.0K tks/s lr=0.0000336 time=146.58 INFO:root:[step 664499] mlm_loss=1.57281 mlm_acc=65.71128 nsp_loss=0.04663 nsp_acc=98.268 throughput=145.0K tks/s lr=0.0000336 time=132.79 INFO:root:[step 664749] mlm_loss=1.50130 mlm_acc=67.19809 nsp_loss=0.03128 nsp_acc=98.913 throughput=122.0K tks/s lr=0.0000335 time=121.95 INFO:root:[step 664999] mlm_loss=1.62590 mlm_acc=66.22750 nsp_loss=0.02702 nsp_acc=99.035 throughput=136.0K tks/s lr=0.0000335 time=131.85 INFO:root:[step 664999] Saving checkpoints to /home/ubuntu/ckpt-master/0664999.params, /home/ubuntu/ckpt-master/0664999.states. INFO:root:[step 665249] mlm_loss=1.63590 mlm_acc=66.00921 nsp_loss=0.02424 nsp_acc=99.140 throughput=126.0K tks/s lr=0.0000335 time=150.07 INFO:root:[step 665499] mlm_loss=1.50591 mlm_acc=66.91681 nsp_loss=0.03016 nsp_acc=98.930 throughput=137.0K tks/s lr=0.0000335 time=122.10 INFO:root:[step 665749] mlm_loss=1.51921 mlm_acc=66.19717 nsp_loss=0.03111 nsp_acc=98.892 throughput=133.0K tks/s lr=0.0000334 time=130.95 INFO:root:[step 665999] mlm_loss=1.53669 mlm_acc=66.81797 nsp_loss=0.03052 nsp_acc=98.919 throughput=129.0K tks/s lr=0.0000334 time=125.74 INFO:root:[step 666249] mlm_loss=1.50674 mlm_acc=67.26091 nsp_loss=0.03197 nsp_acc=98.857 throughput=131.0K tks/s lr=0.0000334 time=113.37 INFO:root:[step 666499] mlm_loss=1.54519 mlm_acc=66.82516 nsp_loss=0.03141 nsp_acc=98.870 throughput=129.0K tks/s lr=0.0000334 time=126.66 INFO:root:[step 666749] mlm_loss=1.37955 mlm_acc=68.60825 nsp_loss=0.03454 nsp_acc=98.770 throughput=122.0K tks/s lr=0.0000333 time=107.42 INFO:root:[step 666999] mlm_loss=1.82313 mlm_acc=62.27507 nsp_loss=0.06637 nsp_acc=97.399 throughput=122.0K tks/s lr=0.0000333 time=126.56 INFO:root:[step 667249] mlm_loss=1.60885 mlm_acc=65.23354 nsp_loss=0.06047 nsp_acc=97.676 throughput=146.0K tks/s lr=0.0000333 time=127.68 INFO:root:[step 667499] mlm_loss=1.53910 mlm_acc=66.90728 nsp_loss=0.03325 nsp_acc=98.812 throughput=127.0K tks/s lr=0.0000333 time=127.00 INFO:root:[step 667749] mlm_loss=1.59761 mlm_acc=65.67838 nsp_loss=0.04206 nsp_acc=98.462 throughput=141.0K tks/s lr=0.0000332 time=133.92 INFO:root:[step 667999] mlm_loss=1.62181 mlm_acc=65.39847 nsp_loss=0.04421 nsp_acc=98.257 throughput=139.0K tks/s lr=0.0000332 time=143.10 INFO:root:[step 668249] mlm_loss=1.42643 mlm_acc=68.34908 nsp_loss=0.03369 nsp_acc=98.852 throughput=122.0K tks/s lr=0.0000332 time=108.24 INFO:root:[step 668499] mlm_loss=1.49598 mlm_acc=67.47022 nsp_loss=0.03156 nsp_acc=98.852 throughput=125.0K tks/s lr=0.0000332 time=120.10 INFO:root:[step 668749] mlm_loss=1.63615 mlm_acc=65.00641 nsp_loss=0.08407 nsp_acc=96.441 throughput=139.0K tks/s lr=0.0000331 time=139.85 INFO:root:[step 668999] mlm_loss=1.41054 mlm_acc=67.94378 nsp_loss=0.03741 nsp_acc=98.680 throughput=125.0K tks/s lr=0.0000331 time=107.44 INFO:root:[step 669249] mlm_loss=1.61447 mlm_acc=66.52093 nsp_loss=0.02807 nsp_acc=98.943 throughput=133.0K tks/s lr=0.0000331 time=132.62 INFO:root:[step 669499] mlm_loss=1.59279 mlm_acc=64.30523 nsp_loss=0.04114 nsp_acc=98.516 throughput=141.0K tks/s lr=0.0000331 time=137.43 INFO:root:[step 669749] mlm_loss=1.63969 mlm_acc=65.57224 nsp_loss=0.02519 nsp_acc=99.064 throughput=143.0K tks/s lr=0.0000330 time=137.57 INFO:root:[step 669999] mlm_loss=1.65217 mlm_acc=63.65558 nsp_loss=0.04066 nsp_acc=98.506 throughput=143.0K tks/s lr=0.0000330 time=132.53 INFO:root:[step 669999] Saving checkpoints to /home/ubuntu/ckpt-master/0669999.params, /home/ubuntu/ckpt-master/0669999.states. INFO:root:[step 670249] mlm_loss=1.46714 mlm_acc=67.47406 nsp_loss=0.03499 nsp_acc=98.756 throughput=103.0K tks/s lr=0.0000330 time=134.18 INFO:root:[step 670499] mlm_loss=1.39672 mlm_acc=68.24007 nsp_loss=0.03644 nsp_acc=98.752 throughput=123.0K tks/s lr=0.0000330 time=109.71 INFO:root:[step 670749] mlm_loss=1.59413 mlm_acc=65.37980 nsp_loss=0.05140 nsp_acc=98.032 throughput=145.0K tks/s lr=0.0000329 time=139.82 INFO:root:[step 670999] mlm_loss=1.56382 mlm_acc=66.10400 nsp_loss=0.03697 nsp_acc=98.568 throughput=134.0K tks/s lr=0.0000329 time=134.89 INFO:root:[step 671249] mlm_loss=1.35743 mlm_acc=68.96311 nsp_loss=0.03576 nsp_acc=98.766 throughput=115.0K tks/s lr=0.0000329 time=105.52 INFO:root:[step 671499] mlm_loss=1.50814 mlm_acc=67.23681 nsp_loss=0.03149 nsp_acc=98.895 throughput=125.0K tks/s lr=0.0000329 time=123.85 INFO:root:[step 671749] mlm_loss=1.51498 mlm_acc=67.20409 nsp_loss=0.03100 nsp_acc=98.887 throughput=132.0K tks/s lr=0.0000328 time=115.59 INFO:root:[step 671999] mlm_loss=1.78352 mlm_acc=63.15514 nsp_loss=0.03772 nsp_acc=98.611 throughput=150.0K tks/s lr=0.0000328 time=158.20 INFO:root:[step 672249] mlm_loss=1.74390 mlm_acc=64.07106 nsp_loss=0.04182 nsp_acc=98.374 throughput=154.0K tks/s lr=0.0000328 time=152.86 INFO:root:[step 672499] mlm_loss=1.36853 mlm_acc=68.23205 nsp_loss=0.03626 nsp_acc=98.712 throughput=123.0K tks/s lr=0.0000328 time=112.59 INFO:root:[step 672749] mlm_loss=1.58572 mlm_acc=65.70595 nsp_loss=0.05001 nsp_acc=98.124 throughput=146.0K tks/s lr=0.0000327 time=141.84 INFO:root:[step 672999] mlm_loss=1.68215 mlm_acc=64.71910 nsp_loss=0.04760 nsp_acc=98.123 throughput=145.0K tks/s lr=0.0000327 time=142.85 INFO:root:[step 673249] mlm_loss=1.53487 mlm_acc=66.78230 nsp_loss=0.03100 nsp_acc=98.930 throughput=126.0K tks/s lr=0.0000327 time=125.71 INFO:root:[step 673499] mlm_loss=1.56948 mlm_acc=66.63390 nsp_loss=0.03142 nsp_acc=98.871 throughput=128.0K tks/s lr=0.0000327 time=127.03 INFO:root:[step 673749] mlm_loss=1.67434 mlm_acc=64.57056 nsp_loss=0.04373 nsp_acc=98.369 throughput=146.0K tks/s lr=0.0000326 time=150.06 INFO:root:[step 673999] mlm_loss=1.45643 mlm_acc=67.72130 nsp_loss=0.03150 nsp_acc=98.879 throughput=127.0K tks/s lr=0.0000326 time=113.19 INFO:root:[step 674249] mlm_loss=1.49196 mlm_acc=67.87191 nsp_loss=0.03015 nsp_acc=98.968 throughput=125.0K tks/s lr=0.0000326 time=126.44 INFO:root:[step 674499] mlm_loss=1.52349 mlm_acc=65.37915 nsp_loss=0.06056 nsp_acc=97.630 throughput=143.0K tks/s lr=0.0000326 time=137.01 INFO:root:[step 674749] mlm_loss=1.55011 mlm_acc=64.82512 nsp_loss=0.03456 nsp_acc=98.768 throughput=137.0K tks/s lr=0.0000325 time=130.33 INFO:root:[step 674999] mlm_loss=1.53475 mlm_acc=66.50846 nsp_loss=0.03291 nsp_acc=98.838 throughput=128.0K tks/s lr=0.0000325 time=131.62 INFO:root:[step 674999] Saving checkpoints to /home/ubuntu/ckpt-master/0674999.params, /home/ubuntu/ckpt-master/0674999.states. INFO:root:[step 675249] mlm_loss=1.37975 mlm_acc=68.19491 nsp_loss=0.03618 nsp_acc=98.730 throughput=107.0K tks/s lr=0.0000325 time=125.14 INFO:root:[step 675499] mlm_loss=1.64475 mlm_acc=64.64499 nsp_loss=0.12303 nsp_acc=94.843 throughput=146.0K tks/s lr=0.0000325 time=157.46 INFO:root:[step 675749] mlm_loss=1.56272 mlm_acc=66.74103 nsp_loss=0.05232 nsp_acc=97.969 throughput=150.0K tks/s lr=0.0000324 time=154.22 INFO:root:[step 675999] mlm_loss=1.57315 mlm_acc=66.51628 nsp_loss=0.03178 nsp_acc=98.912 throughput=137.0K tks/s lr=0.0000324 time=125.88 INFO:root:[step 676249] mlm_loss=1.59688 mlm_acc=65.75287 nsp_loss=0.05087 nsp_acc=98.084 throughput=142.0K tks/s lr=0.0000324 time=146.15 INFO:root:[step 676499] mlm_loss=1.48591 mlm_acc=67.09291 nsp_loss=0.03056 nsp_acc=98.918 throughput=135.0K tks/s lr=0.0000324 time=116.14 INFO:root:[step 676749] mlm_loss=1.47481 mlm_acc=67.31866 nsp_loss=0.03554 nsp_acc=98.760 throughput=119.0K tks/s lr=0.0000323 time=121.08 INFO:root:[step 676999] mlm_loss=1.56251 mlm_acc=66.61445 nsp_loss=0.03152 nsp_acc=98.869 throughput=136.0K tks/s lr=0.0000323 time=116.99 INFO:root:[step 677249] mlm_loss=1.64372 mlm_acc=64.68183 nsp_loss=0.05495 nsp_acc=97.814 throughput=141.0K tks/s lr=0.0000323 time=140.70 INFO:root:[step 677499] mlm_loss=1.62117 mlm_acc=66.01911 nsp_loss=0.02534 nsp_acc=99.049 throughput=142.0K tks/s lr=0.0000323 time=136.61 INFO:root:[step 677749] mlm_loss=1.55203 mlm_acc=66.76707 nsp_loss=0.02934 nsp_acc=98.965 throughput=130.0K tks/s lr=0.0000322 time=126.72 INFO:root:[step 677999] mlm_loss=1.42800 mlm_acc=67.97374 nsp_loss=0.03443 nsp_acc=98.781 throughput=125.0K tks/s lr=0.0000322 time=111.26 INFO:root:[step 678249] mlm_loss=1.46079 mlm_acc=67.60077 nsp_loss=0.03507 nsp_acc=98.756 throughput=119.0K tks/s lr=0.0000322 time=116.17 INFO:root:[step 678499] mlm_loss=1.66060 mlm_acc=65.14769 nsp_loss=0.04226 nsp_acc=98.339 throughput=150.0K tks/s lr=0.0000322 time=152.52 INFO:root:[step 678749] mlm_loss=1.54219 mlm_acc=67.16063 nsp_loss=0.03213 nsp_acc=98.853 throughput=139.0K tks/s lr=0.0000321 time=119.90 INFO:root:[step 678999] mlm_loss=1.41690 mlm_acc=67.45119 nsp_loss=0.03771 nsp_acc=98.669 throughput=119.0K tks/s lr=0.0000321 time=121.75 INFO:root:[step 679249] mlm_loss=1.67104 mlm_acc=64.39764 nsp_loss=0.04381 nsp_acc=98.287 throughput=147.0K tks/s lr=0.0000321 time=150.07 INFO:root:overflow detected. set loss_scale = 256.0 INFO:root:[step 679499] mlm_loss=1.73763 mlm_acc=63.44775 nsp_loss=0.03672 nsp_acc=98.659 throughput=147.0K tks/s lr=0.0000321 time=143.90 INFO:root:[step 679749] mlm_loss=1.67787 mlm_acc=63.94173 nsp_loss=0.07046 nsp_acc=97.136 throughput=135.0K tks/s lr=0.0000320 time=136.62 INFO:root:[step 679999] mlm_loss=1.53170 mlm_acc=66.53690 nsp_loss=0.03180 nsp_acc=98.865 throughput=134.0K tks/s lr=0.0000320 time=129.81 INFO:root:[step 679999] Saving checkpoints to /home/ubuntu/ckpt-master/0679999.params, /home/ubuntu/ckpt-master/0679999.states. INFO:root:[step 680249] mlm_loss=1.62085 mlm_acc=66.08114 nsp_loss=0.02829 nsp_acc=98.954 throughput=123.0K tks/s lr=0.0000320 time=151.24 INFO:root:[step 680499] mlm_loss=1.56520 mlm_acc=65.52978 nsp_loss=0.04454 nsp_acc=98.301 throughput=147.0K tks/s lr=0.0000320 time=132.07 INFO:root:[step 680749] mlm_loss=1.47205 mlm_acc=67.53381 nsp_loss=0.03645 nsp_acc=98.685 throughput=118.0K tks/s lr=0.0000319 time=122.69 INFO:root:[step 680999] mlm_loss=1.42563 mlm_acc=68.02055 nsp_loss=0.03535 nsp_acc=98.730 throughput=128.0K tks/s lr=0.0000319 time=111.92 INFO:root:[step 681249] mlm_loss=1.66191 mlm_acc=65.09298 nsp_loss=0.03162 nsp_acc=98.790 throughput=149.0K tks/s lr=0.0000319 time=158.97 INFO:root:[step 681499] mlm_loss=1.58334 mlm_acc=65.06853 nsp_loss=0.04101 nsp_acc=98.506 throughput=147.0K tks/s lr=0.0000319 time=151.40 INFO:root:[step 681749] mlm_loss=1.56316 mlm_acc=66.76096 nsp_loss=0.02812 nsp_acc=98.970 throughput=137.0K tks/s lr=0.0000318 time=130.95 INFO:root:[step 681999] mlm_loss=1.54894 mlm_acc=66.58428 nsp_loss=0.02764 nsp_acc=99.027 throughput=133.0K tks/s lr=0.0000318 time=136.15 INFO:root:[step 682249] mlm_loss=1.43782 mlm_acc=67.74046 nsp_loss=0.03314 nsp_acc=98.827 throughput=134.0K tks/s lr=0.0000318 time=115.79 INFO:root:[step 682499] mlm_loss=1.52611 mlm_acc=67.07767 nsp_loss=0.03099 nsp_acc=98.864 throughput=129.0K tks/s lr=0.0000318 time=127.09 INFO:root:[step 682749] mlm_loss=1.65040 mlm_acc=65.99845 nsp_loss=0.02606 nsp_acc=99.058 throughput=142.0K tks/s lr=0.0000317 time=138.50 INFO:root:[step 682999] mlm_loss=1.47570 mlm_acc=67.48632 nsp_loss=0.03170 nsp_acc=98.905 throughput=131.0K tks/s lr=0.0000317 time=116.50 INFO:root:[step 683249] mlm_loss=1.42380 mlm_acc=68.11635 nsp_loss=0.03855 nsp_acc=98.625 throughput=109.0K tks/s lr=0.0000317 time=117.92 INFO:root:[step 683499] mlm_loss=1.31762 mlm_acc=68.42265 nsp_loss=0.04951 nsp_acc=98.210 throughput=115.0K tks/s lr=0.0000317 time=109.14 INFO:root:[step 683749] mlm_loss=1.56056 mlm_acc=64.47625 nsp_loss=0.05072 nsp_acc=98.109 throughput=151.0K tks/s lr=0.0000316 time=150.34 INFO:root:[step 683999] mlm_loss=1.56419 mlm_acc=64.88973 nsp_loss=0.03995 nsp_acc=98.500 throughput=148.0K tks/s lr=0.0000316 time=149.09 INFO:root:[step 684249] mlm_loss=1.63199 mlm_acc=65.19934 nsp_loss=0.04752 nsp_acc=98.194 throughput=137.0K tks/s lr=0.0000316 time=134.61 INFO:root:[step 684499] mlm_loss=1.66396 mlm_acc=64.06925 nsp_loss=0.06580 nsp_acc=97.415 throughput=152.0K tks/s lr=0.0000316 time=173.25 INFO:root:[step 684749] mlm_loss=1.41837 mlm_acc=67.64676 nsp_loss=0.03725 nsp_acc=98.651 throughput=127.0K tks/s lr=0.0000315 time=110.50 INFO:root:[step 684999] mlm_loss=1.55609 mlm_acc=66.26656 nsp_loss=0.03906 nsp_acc=98.526 throughput=135.0K tks/s lr=0.0000315 time=127.37 INFO:root:[step 684999] Saving checkpoints to /home/ubuntu/ckpt-master/0684999.params, /home/ubuntu/ckpt-master/0684999.states. INFO:root:[step 685249] mlm_loss=1.62533 mlm_acc=65.08345 nsp_loss=0.05184 nsp_acc=97.947 throughput=127.0K tks/s lr=0.0000315 time=155.88 INFO:root:[step 685499] mlm_loss=1.51621 mlm_acc=67.16207 nsp_loss=0.03142 nsp_acc=98.849 throughput=131.0K tks/s lr=0.0000315 time=116.34 INFO:root:[step 685749] mlm_loss=1.54969 mlm_acc=66.79857 nsp_loss=0.02725 nsp_acc=99.012 throughput=133.0K tks/s lr=0.0000314 time=127.41 INFO:root:[step 685999] mlm_loss=1.48920 mlm_acc=67.23968 nsp_loss=0.03292 nsp_acc=98.863 throughput=133.0K tks/s lr=0.0000314 time=118.92 INFO:root:[step 686249] mlm_loss=1.72863 mlm_acc=63.44742 nsp_loss=0.03389 nsp_acc=98.754 throughput=141.0K tks/s lr=0.0000314 time=157.80 INFO:root:[step 686499] mlm_loss=1.50867 mlm_acc=66.08617 nsp_loss=0.05066 nsp_acc=98.046 throughput=141.0K tks/s lr=0.0000314 time=133.52 INFO:root:[step 686749] mlm_loss=1.80578 mlm_acc=63.07808 nsp_loss=0.05809 nsp_acc=97.694 throughput=157.0K tks/s lr=0.0000313 time=157.99 INFO:root:[step 686999] mlm_loss=1.64641 mlm_acc=65.70727 nsp_loss=0.04000 nsp_acc=98.447 throughput=147.0K tks/s lr=0.0000313 time=146.22 INFO:root:[step 687249] mlm_loss=1.54237 mlm_acc=66.53791 nsp_loss=0.02904 nsp_acc=98.947 throughput=135.0K tks/s lr=0.0000313 time=136.52 INFO:root:[step 687499] mlm_loss=1.37581 mlm_acc=68.23452 nsp_loss=0.03675 nsp_acc=98.726 throughput=121.0K tks/s lr=0.0000313 time=107.37 INFO:root:[step 687749] mlm_loss=1.46468 mlm_acc=67.77126 nsp_loss=0.03211 nsp_acc=98.848 throughput=122.0K tks/s lr=0.0000312 time=123.59 INFO:root:[step 687999] mlm_loss=1.41762 mlm_acc=68.19170 nsp_loss=0.03370 nsp_acc=98.823 throughput=126.0K tks/s lr=0.0000312 time=112.03 INFO:root:[step 688249] mlm_loss=1.47817 mlm_acc=67.40444 nsp_loss=0.03085 nsp_acc=98.914 throughput=119.0K tks/s lr=0.0000312 time=122.37 INFO:root:[step 688499] mlm_loss=1.64585 mlm_acc=64.31940 nsp_loss=0.05495 nsp_acc=97.868 throughput=143.0K tks/s lr=0.0000312 time=123.19 INFO:root:[step 688749] mlm_loss=1.72824 mlm_acc=64.57697 nsp_loss=0.03433 nsp_acc=98.717 throughput=146.0K tks/s lr=0.0000311 time=153.30 INFO:root:[step 688999] mlm_loss=1.76113 mlm_acc=63.44296 nsp_loss=0.04089 nsp_acc=98.383 throughput=154.0K tks/s lr=0.0000311 time=154.31 INFO:root:[step 689249] mlm_loss=1.37121 mlm_acc=68.35680 nsp_loss=0.03353 nsp_acc=98.830 throughput=119.0K tks/s lr=0.0000311 time=121.93 INFO:root:[step 689499] mlm_loss=1.46572 mlm_acc=66.63472 nsp_loss=0.04476 nsp_acc=98.305 throughput=142.0K tks/s lr=0.0000311 time=120.85 INFO:root:[step 689749] mlm_loss=1.46053 mlm_acc=67.67277 nsp_loss=0.03168 nsp_acc=98.847 throughput=128.0K tks/s lr=0.0000310 time=128.41 INFO:root:[step 689999] mlm_loss=1.53704 mlm_acc=67.00913 nsp_loss=0.02452 nsp_acc=99.183 throughput=131.0K tks/s lr=0.0000310 time=126.18 INFO:root:[step 689999] Saving checkpoints to /home/ubuntu/ckpt-master/0689999.params, /home/ubuntu/ckpt-master/0689999.states. INFO:root:[step 690249] mlm_loss=1.47709 mlm_acc=67.53289 nsp_loss=0.02681 nsp_acc=99.056 throughput=118.0K tks/s lr=0.0000310 time=131.76 INFO:root:[step 690499] mlm_loss=1.35957 mlm_acc=68.59221 nsp_loss=0.03154 nsp_acc=98.881 throughput=123.0K tks/s lr=0.0000310 time=107.85 INFO:root:[step 690749] mlm_loss=1.66378 mlm_acc=64.33410 nsp_loss=0.07208 nsp_acc=97.059 throughput=151.0K tks/s lr=0.0000309 time=170.03 INFO:root:[step 690999] mlm_loss=1.43301 mlm_acc=66.79806 nsp_loss=0.02949 nsp_acc=98.962 throughput=139.0K tks/s lr=0.0000309 time=126.28 INFO:root:[step 691249] mlm_loss=1.47478 mlm_acc=66.18838 nsp_loss=0.05214 nsp_acc=97.991 throughput=134.0K tks/s lr=0.0000309 time=135.09 INFO:root:[step 691499] mlm_loss=1.37774 mlm_acc=68.43400 nsp_loss=0.02933 nsp_acc=98.960 throughput=116.0K tks/s lr=0.0000309 time=117.65 INFO:root:[step 691749] mlm_loss=1.40647 mlm_acc=68.51584 nsp_loss=0.03139 nsp_acc=98.913 throughput=129.0K tks/s lr=0.0000308 time=115.16 INFO:root:[step 691999] mlm_loss=1.48552 mlm_acc=66.83959 nsp_loss=0.02759 nsp_acc=99.037 throughput=137.0K tks/s lr=0.0000308 time=132.02 INFO:root:[step 692249] mlm_loss=1.46001 mlm_acc=66.62321 nsp_loss=0.03029 nsp_acc=98.911 throughput=131.0K tks/s lr=0.0000308 time=124.25 INFO:root:[step 692499] mlm_loss=1.44189 mlm_acc=67.49130 nsp_loss=0.02978 nsp_acc=98.937 throughput=123.0K tks/s lr=0.0000308 time=122.23 INFO:root:[step 692749] mlm_loss=1.61449 mlm_acc=65.47630 nsp_loss=0.04203 nsp_acc=98.416 throughput=141.0K tks/s lr=0.0000307 time=143.37 INFO:root:[step 692999] mlm_loss=1.54360 mlm_acc=66.74568 nsp_loss=0.02156 nsp_acc=99.268 throughput=140.0K tks/s lr=0.0000307 time=133.97 INFO:root:[step 693249] mlm_loss=1.69151 mlm_acc=63.65752 nsp_loss=0.02530 nsp_acc=99.130 throughput=148.0K tks/s lr=0.0000307 time=146.75 INFO:root:[step 693499] mlm_loss=1.45308 mlm_acc=67.78604 nsp_loss=0.02218 nsp_acc=99.231 throughput=123.0K tks/s lr=0.0000307 time=123.06 INFO:root:[step 693749] mlm_loss=1.50473 mlm_acc=67.19740 nsp_loss=0.02738 nsp_acc=99.061 throughput=137.0K tks/s lr=0.0000306 time=120.56 INFO:root:[step 693999] mlm_loss=1.42951 mlm_acc=67.93283 nsp_loss=0.02882 nsp_acc=98.989 throughput=117.0K tks/s lr=0.0000306 time=119.59 INFO:root:[step 694249] mlm_loss=1.55522 mlm_acc=65.51272 nsp_loss=0.03687 nsp_acc=98.557 throughput=149.0K tks/s lr=0.0000306 time=131.66 INFO:root:[step 694499] mlm_loss=1.59944 mlm_acc=66.40740 nsp_loss=0.01818 nsp_acc=99.372 throughput=140.0K tks/s lr=0.0000306 time=137.37 INFO:root:[step 694749] mlm_loss=1.54569 mlm_acc=67.17391 nsp_loss=0.02395 nsp_acc=99.155 throughput=132.0K tks/s lr=0.0000305 time=128.45 INFO:root:[step 694999] mlm_loss=1.52265 mlm_acc=67.25347 nsp_loss=0.02211 nsp_acc=99.211 throughput=128.0K tks/s lr=0.0000305 time=129.09 INFO:root:[step 694999] Saving checkpoints to /home/ubuntu/ckpt-master/0694999.params, /home/ubuntu/ckpt-master/0694999.states. INFO:root:[step 695249] mlm_loss=1.51092 mlm_acc=66.85039 nsp_loss=0.02466 nsp_acc=99.111 throughput=118.0K tks/s lr=0.0000305 time=146.67 INFO:root:[step 695499] mlm_loss=1.40390 mlm_acc=68.03800 nsp_loss=0.03319 nsp_acc=98.813 throughput=123.0K tks/s lr=0.0000305 time=109.24 INFO:root:[step 695749] mlm_loss=1.37614 mlm_acc=68.36662 nsp_loss=0.03206 nsp_acc=98.866 throughput=119.0K tks/s lr=0.0000304 time=108.39 INFO:root:[step 695999] mlm_loss=1.36288 mlm_acc=68.42269 nsp_loss=0.03456 nsp_acc=98.786 throughput=117.0K tks/s lr=0.0000304 time=115.44 INFO:root:[step 696249] mlm_loss=1.59544 mlm_acc=64.65261 nsp_loss=0.04060 nsp_acc=98.497 throughput=143.0K tks/s lr=0.0000304 time=130.86 INFO:root:[step 696499] mlm_loss=1.58975 mlm_acc=66.24155 nsp_loss=0.01827 nsp_acc=99.372 throughput=145.0K tks/s lr=0.0000304 time=140.50 INFO:root:[step 696749] mlm_loss=1.37913 mlm_acc=69.38104 nsp_loss=0.03112 nsp_acc=98.896 throughput=132.0K tks/s lr=0.0000303 time=129.91 INFO:root:[step 696999] mlm_loss=1.55989 mlm_acc=66.90784 nsp_loss=0.02235 nsp_acc=99.182 throughput=138.0K tks/s lr=0.0000303 time=133.82 INFO:root:[step 697249] mlm_loss=1.74190 mlm_acc=63.51086 nsp_loss=0.04460 nsp_acc=98.329 throughput=157.0K tks/s lr=0.0000303 time=156.63 INFO:root:[step 697499] mlm_loss=1.54361 mlm_acc=66.76184 nsp_loss=0.01974 nsp_acc=99.317 throughput=137.0K tks/s lr=0.0000303 time=135.80 INFO:root:[step 697749] mlm_loss=1.41354 mlm_acc=68.08200 nsp_loss=0.02941 nsp_acc=98.924 throughput=121.0K tks/s lr=0.0000302 time=117.91 INFO:root:[step 697999] mlm_loss=1.62796 mlm_acc=65.89988 nsp_loss=0.03072 nsp_acc=98.803 throughput=141.0K tks/s lr=0.0000302 time=136.63 INFO:root:[step 698249] mlm_loss=1.66501 mlm_acc=64.05367 nsp_loss=0.07628 nsp_acc=96.822 throughput=150.0K tks/s lr=0.0000302 time=151.58 INFO:root:[step 698499] mlm_loss=1.57927 mlm_acc=66.69397 nsp_loss=0.01988 nsp_acc=99.306 throughput=141.0K tks/s lr=0.0000302 time=136.82 INFO:root:[step 698749] mlm_loss=1.38778 mlm_acc=68.68338 nsp_loss=0.02882 nsp_acc=98.986 throughput=129.0K tks/s lr=0.0000301 time=115.86 INFO:root:[step 698999] mlm_loss=1.34556 mlm_acc=68.60254 nsp_loss=0.03315 nsp_acc=98.872 throughput=109.0K tks/s lr=0.0000301 time=118.16 INFO:root:[step 699249] mlm_loss=1.33778 mlm_acc=68.87595 nsp_loss=0.03478 nsp_acc=98.798 throughput=116.0K tks/s lr=0.0000301 time=109.05 INFO:root:[step 699499] mlm_loss=1.36911 mlm_acc=68.32748 nsp_loss=0.02907 nsp_acc=99.002 throughput=124.0K tks/s lr=0.0000301 time=110.19 INFO:root:[step 699749] mlm_loss=1.57933 mlm_acc=65.69841 nsp_loss=0.02477 nsp_acc=99.152 throughput=141.0K tks/s lr=0.0000300 time=132.79 INFO:root:[step 699999] mlm_loss=1.75211 mlm_acc=63.51851 nsp_loss=0.03130 nsp_acc=98.846 throughput=154.0K tks/s lr=0.0000300 time=171.32 INFO:root:[step 699999] Saving checkpoints to /home/ubuntu/ckpt-master/0699999.params, /home/ubuntu/ckpt-master/0699999.states. INFO:root:[step 700249] mlm_loss=1.50842 mlm_acc=66.98492 nsp_loss=0.02975 nsp_acc=98.929 throughput=121.0K tks/s lr=0.0000300 time=137.78 INFO:root:[step 700499] mlm_loss=1.73441 mlm_acc=62.76029 nsp_loss=0.06834 nsp_acc=97.264 throughput=148.0K tks/s lr=0.0000300 time=160.40 INFO:root:[step 700749] mlm_loss=1.55136 mlm_acc=67.19144 nsp_loss=0.02273 nsp_acc=99.168 throughput=139.0K tks/s lr=0.0000299 time=145.25 INFO:root:[step 700999] mlm_loss=1.40977 mlm_acc=67.97799 nsp_loss=0.03310 nsp_acc=98.802 throughput=124.0K tks/s lr=0.0000299 time=109.04 INFO:root:[step 701249] mlm_loss=1.61808 mlm_acc=64.37424 nsp_loss=0.03695 nsp_acc=98.622 throughput=141.0K tks/s lr=0.0000299 time=141.26 INFO:root:[step 701499] mlm_loss=1.62821 mlm_acc=64.65689 nsp_loss=0.05496 nsp_acc=97.833 throughput=149.0K tks/s lr=0.0000299 time=147.85 INFO:root:[step 701749] mlm_loss=1.60337 mlm_acc=65.63623 nsp_loss=0.02971 nsp_acc=98.897 throughput=138.0K tks/s lr=0.0000298 time=136.84 INFO:root:[step 701999] mlm_loss=1.44426 mlm_acc=67.77432 nsp_loss=0.02889 nsp_acc=99.001 throughput=126.0K tks/s lr=0.0000298 time=113.04 INFO:root:[step 702249] mlm_loss=1.69038 mlm_acc=63.98296 nsp_loss=0.02523 nsp_acc=99.103 throughput=148.0K tks/s lr=0.0000298 time=143.93 INFO:root:[step 702499] mlm_loss=1.36282 mlm_acc=68.31628 nsp_loss=0.03010 nsp_acc=98.970 throughput=118.0K tks/s lr=0.0000298 time=123.88 INFO:root:[step 702749] mlm_loss=1.38785 mlm_acc=68.45798 nsp_loss=0.02663 nsp_acc=99.133 throughput=129.0K tks/s lr=0.0000297 time=112.98 INFO:root:[step 702999] mlm_loss=1.39301 mlm_acc=68.45476 nsp_loss=0.02873 nsp_acc=99.020 throughput=114.0K tks/s lr=0.0000297 time=117.33 INFO:root:[step 703249] mlm_loss=1.53994 mlm_acc=65.88657 nsp_loss=0.03748 nsp_acc=98.581 throughput=141.0K tks/s lr=0.0000297 time=139.50 INFO:root:[step 703499] mlm_loss=1.55488 mlm_acc=65.35788 nsp_loss=0.03401 nsp_acc=98.769 throughput=144.0K tks/s lr=0.0000297 time=122.71 INFO:root:[step 703749] mlm_loss=1.67488 mlm_acc=64.84541 nsp_loss=0.04568 nsp_acc=98.169 throughput=154.0K tks/s lr=0.0000296 time=170.64 INFO:root:[step 703999] mlm_loss=1.48352 mlm_acc=66.71163 nsp_loss=0.04344 nsp_acc=98.356 throughput=134.0K tks/s lr=0.0000296 time=123.17 INFO:root:[step 704249] mlm_loss=1.44876 mlm_acc=66.91344 nsp_loss=0.05322 nsp_acc=97.968 throughput=129.0K tks/s lr=0.0000296 time=127.51 INFO:root:[step 704499] mlm_loss=1.62715 mlm_acc=65.67634 nsp_loss=0.06045 nsp_acc=97.487 throughput=146.0K tks/s lr=0.0000296 time=147.65 INFO:root:[step 704749] mlm_loss=1.76866 mlm_acc=63.57015 nsp_loss=0.06893 nsp_acc=97.228 throughput=154.0K tks/s lr=0.0000295 time=155.87 INFO:root:[step 704999] mlm_loss=1.60584 mlm_acc=65.40069 nsp_loss=0.11378 nsp_acc=95.153 throughput=143.0K tks/s lr=0.0000295 time=145.05 INFO:root:[step 704999] Saving checkpoints to /home/ubuntu/ckpt-master/0704999.params, /home/ubuntu/ckpt-master/0704999.states. INFO:root:[step 705249] mlm_loss=1.51581 mlm_acc=67.14971 nsp_loss=0.03805 nsp_acc=98.560 throughput=114.0K tks/s lr=0.0000295 time=142.63 INFO:root:[step 705499] mlm_loss=1.45630 mlm_acc=67.72828 nsp_loss=0.03043 nsp_acc=98.942 throughput=128.0K tks/s lr=0.0000295 time=111.75 INFO:root:[step 705749] mlm_loss=1.40727 mlm_acc=68.10445 nsp_loss=0.03033 nsp_acc=98.930 throughput=116.0K tks/s lr=0.0000294 time=120.20 INFO:root:[step 705999] mlm_loss=1.39837 mlm_acc=68.58852 nsp_loss=0.02955 nsp_acc=98.967 throughput=123.0K tks/s lr=0.0000294 time=111.33 INFO:root:[step 706249] mlm_loss=1.67044 mlm_acc=64.34387 nsp_loss=0.03673 nsp_acc=98.590 throughput=150.0K tks/s lr=0.0000294 time=147.97 INFO:root:[step 706499] mlm_loss=1.45175 mlm_acc=67.50192 nsp_loss=0.02911 nsp_acc=98.994 throughput=120.0K tks/s lr=0.0000294 time=124.28 INFO:root:[step 706749] mlm_loss=1.37379 mlm_acc=68.30876 nsp_loss=0.03163 nsp_acc=98.905 throughput=122.0K tks/s lr=0.0000293 time=113.33 INFO:root:[step 706999] mlm_loss=1.50342 mlm_acc=66.82693 nsp_loss=0.02666 nsp_acc=99.069 throughput=128.0K tks/s lr=0.0000293 time=126.13 INFO:root:[step 707249] mlm_loss=1.38983 mlm_acc=68.41566 nsp_loss=0.02994 nsp_acc=98.926 throughput=121.0K tks/s lr=0.0000293 time=111.06 INFO:root:[step 707499] mlm_loss=1.49472 mlm_acc=67.39859 nsp_loss=0.02375 nsp_acc=99.182 throughput=126.0K tks/s lr=0.0000293 time=123.79 INFO:root:[step 707749] mlm_loss=1.54335 mlm_acc=65.58306 nsp_loss=0.04941 nsp_acc=98.111 throughput=142.0K tks/s lr=0.0000292 time=137.86 INFO:root:[step 707999] mlm_loss=1.61911 mlm_acc=66.00588 nsp_loss=0.02078 nsp_acc=99.255 throughput=139.0K tks/s lr=0.0000292 time=143.57 INFO:root:[step 708249] mlm_loss=1.51912 mlm_acc=65.81150 nsp_loss=0.04697 nsp_acc=98.217 throughput=140.0K tks/s lr=0.0000292 time=139.18 INFO:root:[step 708499] mlm_loss=1.47698 mlm_acc=67.69402 nsp_loss=0.02842 nsp_acc=98.982 throughput=131.0K tks/s lr=0.0000292 time=117.87 INFO:root:[step 708749] mlm_loss=1.37260 mlm_acc=68.88787 nsp_loss=0.03207 nsp_acc=98.889 throughput=118.0K tks/s lr=0.0000291 time=108.46 INFO:root:[step 708999] mlm_loss=1.70440 mlm_acc=63.61659 nsp_loss=0.04044 nsp_acc=98.446 throughput=155.0K tks/s lr=0.0000291 time=169.43 INFO:root:[step 709249] mlm_loss=1.65193 mlm_acc=64.49675 nsp_loss=0.04616 nsp_acc=98.186 throughput=144.0K tks/s lr=0.0000291 time=146.27 INFO:root:[step 709499] mlm_loss=1.36935 mlm_acc=68.45336 nsp_loss=0.03530 nsp_acc=98.714 throughput=123.0K tks/s lr=0.0000291 time=111.61 INFO:root:[step 709749] mlm_loss=1.47197 mlm_acc=67.30188 nsp_loss=0.03460 nsp_acc=98.786 throughput=130.0K tks/s lr=0.0000290 time=130.88 INFO:root:[step 709999] mlm_loss=1.43207 mlm_acc=67.95731 nsp_loss=0.03546 nsp_acc=98.745 throughput=124.0K tks/s lr=0.0000290 time=124.51 INFO:root:[step 709999] Saving checkpoints to /home/ubuntu/ckpt-master/0709999.params, /home/ubuntu/ckpt-master/0709999.states. INFO:root:[step 710249] mlm_loss=1.41675 mlm_acc=67.83569 nsp_loss=0.02976 nsp_acc=98.950 throughput=117.0K tks/s lr=0.0000290 time=129.28 INFO:root:[step 710499] mlm_loss=1.58343 mlm_acc=66.26872 nsp_loss=0.02235 nsp_acc=99.206 throughput=139.0K tks/s lr=0.0000290 time=136.63 INFO:root:[step 710749] mlm_loss=1.45792 mlm_acc=68.18757 nsp_loss=0.02912 nsp_acc=98.991 throughput=123.0K tks/s lr=0.0000289 time=120.52 INFO:root:[step 710999] mlm_loss=1.70866 mlm_acc=64.44130 nsp_loss=0.04311 nsp_acc=98.328 throughput=145.0K tks/s lr=0.0000289 time=127.53 INFO:root:[step 711249] mlm_loss=1.44836 mlm_acc=66.56901 nsp_loss=0.03963 nsp_acc=98.557 throughput=124.0K tks/s lr=0.0000289 time=125.09 INFO:root:[step 711499] mlm_loss=1.40739 mlm_acc=66.48506 nsp_loss=0.04281 nsp_acc=98.404 throughput=130.0K tks/s lr=0.0000289 time=121.01 INFO:root:[step 711749] mlm_loss=1.64785 mlm_acc=65.37153 nsp_loss=0.02153 nsp_acc=99.226 throughput=150.0K tks/s lr=0.0000288 time=161.26 INFO:root:[step 711999] mlm_loss=1.46592 mlm_acc=67.14698 nsp_loss=0.03106 nsp_acc=98.826 throughput=133.0K tks/s lr=0.0000288 time=133.44 INFO:root:[step 712249] mlm_loss=1.37068 mlm_acc=68.43749 nsp_loss=0.02902 nsp_acc=98.995 throughput=125.0K tks/s lr=0.0000288 time=109.96 INFO:root:[step 712499] mlm_loss=1.58744 mlm_acc=65.77910 nsp_loss=0.02224 nsp_acc=99.231 throughput=143.0K tks/s lr=0.0000288 time=138.29 INFO:root:[step 712749] mlm_loss=1.47143 mlm_acc=67.69852 nsp_loss=0.02730 nsp_acc=99.051 throughput=124.0K tks/s lr=0.0000287 time=122.97 INFO:root:[step 712999] mlm_loss=1.60924 mlm_acc=66.12615 nsp_loss=0.02508 nsp_acc=99.064 throughput=145.0K tks/s lr=0.0000287 time=139.75 INFO:root:[step 713249] mlm_loss=1.71628 mlm_acc=64.05854 nsp_loss=0.04207 nsp_acc=98.398 throughput=154.0K tks/s lr=0.0000287 time=153.17 INFO:root:[step 713499] mlm_loss=1.42899 mlm_acc=66.47532 nsp_loss=0.03361 nsp_acc=98.837 throughput=128.0K tks/s lr=0.0000287 time=128.50 INFO:root:[step 713749] mlm_loss=1.60582 mlm_acc=65.48001 nsp_loss=0.03507 nsp_acc=98.647 throughput=148.0K tks/s lr=0.0000286 time=152.56 INFO:root:[step 713999] mlm_loss=1.27731 mlm_acc=69.24546 nsp_loss=0.04031 nsp_acc=98.569 throughput=113.0K tks/s lr=0.0000286 time=106.56 INFO:root:[step 714249] mlm_loss=1.26436 mlm_acc=69.60458 nsp_loss=0.03783 nsp_acc=98.684 throughput=108.0K tks/s lr=0.0000286 time=103.22 INFO:root:[step 714499] mlm_loss=1.57782 mlm_acc=66.05263 nsp_loss=0.02302 nsp_acc=99.166 throughput=140.0K tks/s lr=0.0000286 time=136.82 INFO:root:[step 714749] mlm_loss=1.80746 mlm_acc=62.49905 nsp_loss=0.04396 nsp_acc=98.270 throughput=151.0K tks/s lr=0.0000285 time=165.29 INFO:root:[step 714999] mlm_loss=1.45039 mlm_acc=67.58499 nsp_loss=0.02924 nsp_acc=98.942 throughput=133.0K tks/s lr=0.0000285 time=111.75 INFO:root:[step 714999] Saving checkpoints to /home/ubuntu/ckpt-master/0714999.params, /home/ubuntu/ckpt-master/0714999.states. INFO:root:[step 715249] mlm_loss=1.67917 mlm_acc=64.96537 nsp_loss=0.02835 nsp_acc=98.932 throughput=142.0K tks/s lr=0.0000285 time=171.22 INFO:root:[step 715499] mlm_loss=1.61274 mlm_acc=66.22057 nsp_loss=0.02355 nsp_acc=99.175 throughput=142.0K tks/s lr=0.0000285 time=139.91 INFO:root:[step 715749] mlm_loss=1.33496 mlm_acc=67.76735 nsp_loss=0.04332 nsp_acc=98.414 throughput=120.0K tks/s lr=0.0000284 time=123.16 INFO:root:[step 715999] mlm_loss=1.73577 mlm_acc=62.84467 nsp_loss=0.08646 nsp_acc=96.355 throughput=153.0K tks/s lr=0.0000284 time=161.03 INFO:root:[step 716249] mlm_loss=1.52094 mlm_acc=65.18383 nsp_loss=0.05853 nsp_acc=97.674 throughput=138.0K tks/s lr=0.0000284 time=141.03 INFO:root:[step 716499] mlm_loss=1.17520 mlm_acc=74.18246 nsp_loss=0.04302 nsp_acc=98.562 throughput=132.0K tks/s lr=0.0000284 time=132.50 INFO:root:[step 716749] mlm_loss=1.62737 mlm_acc=64.51078 nsp_loss=0.03918 nsp_acc=98.477 throughput=138.0K tks/s lr=0.0000283 time=137.92 INFO:root:[step 716999] mlm_loss=1.39267 mlm_acc=67.16247 nsp_loss=0.04209 nsp_acc=98.430 throughput=143.0K tks/s lr=0.0000283 time=121.67 INFO:root:[step 717249] mlm_loss=1.50899 mlm_acc=66.85382 nsp_loss=0.03168 nsp_acc=98.904 throughput=130.0K tks/s lr=0.0000283 time=130.36 INFO:root:[step 717499] mlm_loss=1.46829 mlm_acc=67.65859 nsp_loss=0.02726 nsp_acc=99.072 throughput=129.0K tks/s lr=0.0000283 time=115.94 INFO:root:[step 717749] mlm_loss=1.62172 mlm_acc=66.14952 nsp_loss=0.02030 nsp_acc=99.260 throughput=140.0K tks/s lr=0.0000282 time=137.21 INFO:root:[step 717999] mlm_loss=1.62830 mlm_acc=66.12326 nsp_loss=0.02324 nsp_acc=99.213 throughput=142.0K tks/s lr=0.0000282 time=139.80 INFO:root:[step 718249] mlm_loss=1.38926 mlm_acc=68.11517 nsp_loss=0.03119 nsp_acc=98.931 throughput=117.0K tks/s lr=0.0000282 time=120.12 INFO:root:[step 718499] mlm_loss=1.43276 mlm_acc=68.02999 nsp_loss=0.03246 nsp_acc=98.895 throughput=123.0K tks/s lr=0.0000282 time=111.59 INFO:root:[step 718749] mlm_loss=1.33348 mlm_acc=68.50391 nsp_loss=0.03600 nsp_acc=98.705 throughput=117.0K tks/s lr=0.0000281 time=108.63 INFO:root:[step 718999] mlm_loss=1.53157 mlm_acc=64.73812 nsp_loss=0.03076 nsp_acc=98.886 throughput=134.0K tks/s lr=0.0000281 time=138.95 INFO:root:[step 719249] mlm_loss=1.54372 mlm_acc=66.79567 nsp_loss=0.02846 nsp_acc=99.006 throughput=129.0K tks/s lr=0.0000281 time=128.01 INFO:root:[step 719499] mlm_loss=1.36319 mlm_acc=68.37891 nsp_loss=0.03591 nsp_acc=98.742 throughput=117.0K tks/s lr=0.0000281 time=109.87 INFO:root:[step 719749] mlm_loss=1.36806 mlm_acc=68.87772 nsp_loss=0.03221 nsp_acc=98.834 throughput=110.0K tks/s lr=0.0000280 time=115.41 INFO:root:[step 719999] mlm_loss=1.35234 mlm_acc=68.76803 nsp_loss=0.03483 nsp_acc=98.783 throughput=122.0K tks/s lr=0.0000280 time=110.43 INFO:root:[step 719999] Saving checkpoints to /home/ubuntu/ckpt-master/0719999.params, /home/ubuntu/ckpt-master/0719999.states. INFO:root:[step 720249] mlm_loss=1.50405 mlm_acc=65.90683 nsp_loss=0.05570 nsp_acc=97.813 throughput=134.0K tks/s lr=0.0000280 time=158.30 INFO:root:[step 720499] mlm_loss=1.60468 mlm_acc=65.04607 nsp_loss=0.08704 nsp_acc=96.417 throughput=141.0K tks/s lr=0.0000280 time=145.52 INFO:root:[step 720749] mlm_loss=1.50914 mlm_acc=66.87904 nsp_loss=0.02777 nsp_acc=98.978 throughput=138.0K tks/s lr=0.0000279 time=120.69 INFO:root:[step 720999] mlm_loss=1.79240 mlm_acc=62.22387 nsp_loss=0.06049 nsp_acc=97.659 throughput=117.0K tks/s lr=0.0000279 time=125.66 INFO:root:[step 721249] mlm_loss=1.43981 mlm_acc=67.84059 nsp_loss=0.03087 nsp_acc=98.914 throughput=128.0K tks/s lr=0.0000279 time=113.37 INFO:root:[step 721499] mlm_loss=1.58762 mlm_acc=66.99475 nsp_loss=0.02305 nsp_acc=99.225 throughput=141.0K tks/s lr=0.0000279 time=136.11 INFO:root:[step 721749] mlm_loss=1.51292 mlm_acc=66.32093 nsp_loss=0.03046 nsp_acc=98.887 throughput=136.0K tks/s lr=0.0000278 time=133.60 INFO:root:[step 721999] mlm_loss=1.35736 mlm_acc=68.66305 nsp_loss=0.03623 nsp_acc=98.729 throughput=116.0K tks/s lr=0.0000278 time=105.06 INFO:root:[step 722249] mlm_loss=1.46030 mlm_acc=66.44417 nsp_loss=0.03244 nsp_acc=98.875 throughput=123.0K tks/s lr=0.0000278 time=121.39 INFO:root:[step 722499] mlm_loss=1.78863 mlm_acc=62.84316 nsp_loss=0.02523 nsp_acc=99.029 throughput=153.0K tks/s lr=0.0000278 time=172.59 INFO:root:[step 722749] mlm_loss=1.54149 mlm_acc=66.75454 nsp_loss=0.02551 nsp_acc=99.094 throughput=142.0K tks/s lr=0.0000277 time=120.89 INFO:root:[step 722999] mlm_loss=1.48357 mlm_acc=66.49065 nsp_loss=0.03028 nsp_acc=98.952 throughput=124.0K tks/s lr=0.0000277 time=125.00 INFO:root:[step 723249] mlm_loss=1.36708 mlm_acc=66.39997 nsp_loss=0.04524 nsp_acc=98.424 throughput=130.0K tks/s lr=0.0000277 time=121.46 INFO:root:[step 723499] mlm_loss=1.47445 mlm_acc=67.24003 nsp_loss=0.02780 nsp_acc=99.029 throughput=127.0K tks/s lr=0.0000277 time=127.22 INFO:root:[step 723999] mlm_loss=2.85439 mlm_acc=67.73548 nsp_loss=0.05873 nsp_acc=98.968 throughput=128.0K tks/s lr=0.0000276 time=243.17 INFO:root:[step 724249] mlm_loss=1.74808 mlm_acc=64.14165 nsp_loss=0.03808 nsp_acc=98.506 throughput=146.0K tks/s lr=0.0000276 time=144.05 INFO:root:[step 724499] mlm_loss=1.62267 mlm_acc=65.69318 nsp_loss=0.02940 nsp_acc=98.928 throughput=139.0K tks/s lr=0.0000276 time=146.34 INFO:root:[step 724749] mlm_loss=1.90015 mlm_acc=62.03602 nsp_loss=0.07425 nsp_acc=96.943 throughput=151.0K tks/s lr=0.0000275 time=151.15 INFO:root:[step 724999] mlm_loss=1.77335 mlm_acc=63.98108 nsp_loss=0.04643 nsp_acc=98.198 throughput=144.0K tks/s lr=0.0000275 time=141.16 INFO:root:[step 724999] Saving checkpoints to /home/ubuntu/ckpt-master/0724999.params, /home/ubuntu/ckpt-master/0724999.states. INFO:root:[step 725249] mlm_loss=1.42545 mlm_acc=67.07543 nsp_loss=0.03691 nsp_acc=98.674 throughput=119.0K tks/s lr=0.0000275 time=139.20 INFO:root:[step 725499] mlm_loss=1.61230 mlm_acc=65.76406 nsp_loss=0.07248 nsp_acc=96.977 throughput=138.0K tks/s lr=0.0000275 time=138.21 INFO:root:[step 725749] mlm_loss=1.47670 mlm_acc=66.46388 nsp_loss=0.03513 nsp_acc=98.713 throughput=130.0K tks/s lr=0.0000274 time=127.47 INFO:root:[step 725999] mlm_loss=1.60572 mlm_acc=65.39535 nsp_loss=0.03191 nsp_acc=98.833 throughput=141.0K tks/s lr=0.0000274 time=138.83 INFO:root:[step 726249] mlm_loss=1.45814 mlm_acc=67.52887 nsp_loss=0.02897 nsp_acc=98.995 throughput=127.0K tks/s lr=0.0000274 time=116.60 INFO:root:[step 726499] mlm_loss=1.29903 mlm_acc=69.28302 nsp_loss=0.03507 nsp_acc=98.848 throughput=109.0K tks/s lr=0.0000274 time=117.08 INFO:root:[step 726749] mlm_loss=1.58227 mlm_acc=66.86418 nsp_loss=0.02482 nsp_acc=99.135 throughput=142.0K tks/s lr=0.0000273 time=122.02 INFO:root:[step 726999] mlm_loss=1.44181 mlm_acc=67.84519 nsp_loss=0.04033 nsp_acc=98.521 throughput=117.0K tks/s lr=0.0000273 time=118.67 INFO:root:[step 727249] mlm_loss=1.46265 mlm_acc=68.05823 nsp_loss=0.02999 nsp_acc=98.996 throughput=131.0K tks/s lr=0.0000273 time=115.52 INFO:root:[step 727499] mlm_loss=1.64412 mlm_acc=65.03670 nsp_loss=0.05328 nsp_acc=97.850 throughput=144.0K tks/s lr=0.0000273 time=141.98 INFO:root:[step 727749] mlm_loss=1.60093 mlm_acc=66.47828 nsp_loss=0.02268 nsp_acc=99.215 throughput=140.0K tks/s lr=0.0000272 time=136.18 INFO:root:[step 727999] mlm_loss=1.46084 mlm_acc=67.82985 nsp_loss=0.03133 nsp_acc=98.855 throughput=119.0K tks/s lr=0.0000272 time=119.54 INFO:root:[step 728249] mlm_loss=1.53510 mlm_acc=66.11682 nsp_loss=0.06232 nsp_acc=97.460 throughput=143.0K tks/s lr=0.0000272 time=129.27 INFO:root:[step 728499] mlm_loss=1.53118 mlm_acc=66.80953 nsp_loss=0.05313 nsp_acc=97.957 throughput=147.0K tks/s lr=0.0000272 time=146.44 INFO:root:[step 728749] mlm_loss=1.38457 mlm_acc=68.41126 nsp_loss=0.03112 nsp_acc=98.912 throughput=115.0K tks/s lr=0.0000271 time=120.03 INFO:root:[step 728999] mlm_loss=1.60332 mlm_acc=66.54555 nsp_loss=0.02181 nsp_acc=99.241 throughput=135.0K tks/s lr=0.0000271 time=134.36 INFO:root:[step 729249] mlm_loss=1.55716 mlm_acc=67.01324 nsp_loss=0.02251 nsp_acc=99.202 throughput=142.0K tks/s lr=0.0000271 time=123.31 INFO:root:[step 729499] mlm_loss=1.45911 mlm_acc=68.73052 nsp_loss=0.03050 nsp_acc=98.938 throughput=129.0K tks/s lr=0.0000271 time=127.50 INFO:root:[step 729749] mlm_loss=1.46338 mlm_acc=68.64400 nsp_loss=0.02669 nsp_acc=99.073 throughput=141.0K tks/s lr=0.0000270 time=140.86 INFO:root:[step 729999] mlm_loss=1.35008 mlm_acc=68.96744 nsp_loss=0.03029 nsp_acc=98.966 throughput=121.0K tks/s lr=0.0000270 time=109.08 INFO:root:[step 729999] Saving checkpoints to /home/ubuntu/ckpt-master/0729999.params, /home/ubuntu/ckpt-master/0729999.states. INFO:root:[step 730249] mlm_loss=1.55295 mlm_acc=65.88146 nsp_loss=0.09027 nsp_acc=96.214 throughput=114.0K tks/s lr=0.0000270 time=143.93 INFO:root:[step 730499] mlm_loss=1.43374 mlm_acc=68.22953 nsp_loss=0.03002 nsp_acc=98.965 throughput=127.0K tks/s lr=0.0000270 time=111.31 INFO:root:[step 730749] mlm_loss=1.35900 mlm_acc=68.69439 nsp_loss=0.03256 nsp_acc=98.837 throughput=115.0K tks/s lr=0.0000269 time=107.08 INFO:root:[step 730999] mlm_loss=1.25330 mlm_acc=68.39133 nsp_loss=0.04712 nsp_acc=98.363 throughput=118.0K tks/s lr=0.0000269 time=116.85 INFO:root:[step 731249] mlm_loss=1.76265 mlm_acc=63.07007 nsp_loss=0.03893 nsp_acc=98.512 throughput=165.0K tks/s lr=0.0000269 time=176.66 INFO:root:[step 731499] mlm_loss=1.57146 mlm_acc=66.97495 nsp_loss=0.02320 nsp_acc=99.185 throughput=136.0K tks/s lr=0.0000269 time=132.03 INFO:root:[step 731749] mlm_loss=1.37550 mlm_acc=71.35630 nsp_loss=0.03502 nsp_acc=98.806 throughput=147.0K tks/s lr=0.0000268 time=141.92 INFO:root:[step 731999] mlm_loss=1.35838 mlm_acc=69.95893 nsp_loss=0.03491 nsp_acc=98.783 throughput=120.0K tks/s lr=0.0000268 time=123.60 INFO:root:[step 732249] mlm_loss=1.38257 mlm_acc=68.53654 nsp_loss=0.03127 nsp_acc=98.917 throughput=119.0K tks/s lr=0.0000268 time=111.54 INFO:root:[step 732499] mlm_loss=1.55473 mlm_acc=64.94435 nsp_loss=0.04647 nsp_acc=98.308 throughput=130.0K tks/s lr=0.0000268 time=131.39 INFO:root:[step 732749] mlm_loss=1.45833 mlm_acc=66.73150 nsp_loss=0.05867 nsp_acc=97.723 throughput=139.0K tks/s lr=0.0000267 time=119.83 INFO:root:[step 732999] mlm_loss=1.49962 mlm_acc=66.43469 nsp_loss=0.05473 nsp_acc=97.816 throughput=129.0K tks/s lr=0.0000267 time=127.74 INFO:root:[step 733249] mlm_loss=1.59200 mlm_acc=65.87689 nsp_loss=0.05092 nsp_acc=98.038 throughput=133.0K tks/s lr=0.0000267 time=135.06 INFO:root:[step 733499] mlm_loss=1.57042 mlm_acc=66.56459 nsp_loss=0.02287 nsp_acc=99.195 throughput=138.0K tks/s lr=0.0000267 time=133.72 INFO:root:[step 733749] mlm_loss=1.51300 mlm_acc=67.47924 nsp_loss=0.02881 nsp_acc=98.958 throughput=132.0K tks/s lr=0.0000266 time=118.19 INFO:root:[step 733999] mlm_loss=1.53651 mlm_acc=67.24054 nsp_loss=0.02536 nsp_acc=99.106 throughput=130.0K tks/s lr=0.0000266 time=128.20 INFO:root:[step 734249] mlm_loss=1.57733 mlm_acc=65.94029 nsp_loss=0.04463 nsp_acc=98.319 throughput=147.0K tks/s lr=0.0000266 time=147.49 INFO:root:[step 734499] mlm_loss=1.43611 mlm_acc=68.09478 nsp_loss=0.02957 nsp_acc=98.951 throughput=127.0K tks/s lr=0.0000266 time=112.71 INFO:root:[step 734749] mlm_loss=1.51894 mlm_acc=67.23625 nsp_loss=0.02686 nsp_acc=99.031 throughput=124.0K tks/s lr=0.0000265 time=126.05 INFO:root:[step 734999] mlm_loss=1.55515 mlm_acc=66.79483 nsp_loss=0.02760 nsp_acc=99.022 throughput=130.0K tks/s lr=0.0000265 time=131.48 INFO:root:[step 734999] Saving checkpoints to /home/ubuntu/ckpt-master/0734999.params, /home/ubuntu/ckpt-master/0734999.states. INFO:root:[step 735249] mlm_loss=1.37856 mlm_acc=68.85457 nsp_loss=0.03151 nsp_acc=98.893 throughput=107.0K tks/s lr=0.0000265 time=122.61 INFO:root:[step 735499] mlm_loss=1.37878 mlm_acc=68.68608 nsp_loss=0.02897 nsp_acc=98.975 throughput=122.0K tks/s lr=0.0000265 time=109.86 INFO:root:[step 735749] mlm_loss=1.50348 mlm_acc=67.48472 nsp_loss=0.02443 nsp_acc=99.120 throughput=133.0K tks/s lr=0.0000264 time=129.18 INFO:root:[step 735999] mlm_loss=1.40659 mlm_acc=68.11746 nsp_loss=0.03235 nsp_acc=98.887 throughput=121.0K tks/s lr=0.0000264 time=125.14 INFO:root:[step 736249] mlm_loss=1.48288 mlm_acc=67.40329 nsp_loss=0.02360 nsp_acc=99.167 throughput=136.0K tks/s lr=0.0000264 time=120.00 INFO:root:[step 736499] mlm_loss=1.71935 mlm_acc=63.72518 nsp_loss=0.06773 nsp_acc=97.267 throughput=149.0K tks/s lr=0.0000264 time=148.92 INFO:root:[step 736749] mlm_loss=1.72810 mlm_acc=64.11208 nsp_loss=0.04445 nsp_acc=98.269 throughput=143.0K tks/s lr=0.0000263 time=159.47 INFO:root:[step 736999] mlm_loss=1.37748 mlm_acc=68.26959 nsp_loss=0.03448 nsp_acc=98.818 throughput=121.0K tks/s lr=0.0000263 time=113.30 INFO:root:[step 737249] mlm_loss=1.32976 mlm_acc=68.61921 nsp_loss=0.04187 nsp_acc=98.492 throughput=115.0K tks/s lr=0.0000263 time=107.17 INFO:root:[step 737499] mlm_loss=1.35165 mlm_acc=68.40901 nsp_loss=0.03889 nsp_acc=98.612 throughput=106.0K tks/s lr=0.0000263 time=119.93 INFO:root:[step 737749] mlm_loss=1.42033 mlm_acc=67.95124 nsp_loss=0.02913 nsp_acc=98.981 throughput=133.0K tks/s lr=0.0000262 time=113.27 INFO:root:[step 737999] mlm_loss=1.45501 mlm_acc=67.68358 nsp_loss=0.02962 nsp_acc=98.931 throughput=122.0K tks/s lr=0.0000262 time=119.33 INFO:root:[step 738249] mlm_loss=1.79474 mlm_acc=62.82228 nsp_loss=0.04006 nsp_acc=98.517 throughput=158.0K tks/s lr=0.0000262 time=159.22 INFO:root:[step 738499] mlm_loss=1.57976 mlm_acc=65.55154 nsp_loss=0.03036 nsp_acc=98.900 throughput=138.0K tks/s lr=0.0000262 time=135.33 INFO:root:[step 738749] mlm_loss=1.47233 mlm_acc=67.61395 nsp_loss=0.03198 nsp_acc=98.878 throughput=120.0K tks/s lr=0.0000261 time=121.22 INFO:root:[step 738999] mlm_loss=1.46597 mlm_acc=67.79354 nsp_loss=0.03020 nsp_acc=98.948 throughput=130.0K tks/s lr=0.0000261 time=115.84 INFO:root:[step 739249] mlm_loss=1.40398 mlm_acc=68.28594 nsp_loss=0.03381 nsp_acc=98.774 throughput=127.0K tks/s lr=0.0000261 time=110.31 INFO:root:[step 739499] mlm_loss=1.77971 mlm_acc=63.15663 nsp_loss=0.03695 nsp_acc=98.655 throughput=154.0K tks/s lr=0.0000261 time=168.75 INFO:root:[step 739749] mlm_loss=1.76194 mlm_acc=63.33321 nsp_loss=0.06084 nsp_acc=97.579 throughput=159.0K tks/s lr=0.0000260 time=176.91 INFO:root:[step 739999] mlm_loss=1.52280 mlm_acc=64.84542 nsp_loss=0.04709 nsp_acc=98.184 throughput=134.0K tks/s lr=0.0000260 time=126.81 INFO:root:[step 739999] Saving checkpoints to /home/ubuntu/ckpt-master/0739999.params, /home/ubuntu/ckpt-master/0739999.states. INFO:root:[step 740249] mlm_loss=1.15678 mlm_acc=74.70824 nsp_loss=0.04598 nsp_acc=98.387 throughput=126.0K tks/s lr=0.0000260 time=151.37 INFO:root:[step 740499] mlm_loss=1.47802 mlm_acc=67.75609 nsp_loss=0.02751 nsp_acc=99.030 throughput=125.0K tks/s lr=0.0000260 time=128.80 INFO:root:[step 740749] mlm_loss=1.36410 mlm_acc=68.62925 nsp_loss=0.03444 nsp_acc=98.883 throughput=126.0K tks/s lr=0.0000259 time=108.56 INFO:root:[step 740999] mlm_loss=1.35124 mlm_acc=68.22325 nsp_loss=0.04501 nsp_acc=98.284 throughput=118.0K tks/s lr=0.0000259 time=110.69 INFO:root:[step 741249] mlm_loss=1.48323 mlm_acc=67.19432 nsp_loss=0.03452 nsp_acc=98.724 throughput=126.0K tks/s lr=0.0000259 time=122.69 INFO:root:[step 741499] mlm_loss=1.53078 mlm_acc=65.34119 nsp_loss=0.03471 nsp_acc=98.770 throughput=143.0K tks/s lr=0.0000259 time=144.86 INFO:root:[step 741749] mlm_loss=1.38546 mlm_acc=68.61286 nsp_loss=0.03483 nsp_acc=98.781 throughput=123.0K tks/s lr=0.0000258 time=109.37 INFO:root:[step 741999] mlm_loss=1.62975 mlm_acc=64.96932 nsp_loss=0.03016 nsp_acc=98.900 throughput=143.0K tks/s lr=0.0000258 time=138.31 INFO:root:[step 742249] mlm_loss=1.74331 mlm_acc=63.39426 nsp_loss=0.03843 nsp_acc=98.528 throughput=150.0K tks/s lr=0.0000258 time=165.27 INFO:root:[step 742499] mlm_loss=1.46361 mlm_acc=66.81667 nsp_loss=0.06865 nsp_acc=97.196 throughput=133.0K tks/s lr=0.0000258 time=121.93 INFO:root:[step 742749] mlm_loss=1.63475 mlm_acc=64.41446 nsp_loss=0.08571 nsp_acc=96.412 throughput=147.0K tks/s lr=0.0000257 time=145.26 INFO:root:[step 742999] mlm_loss=1.58473 mlm_acc=65.93823 nsp_loss=0.05659 nsp_acc=97.735 throughput=146.0K tks/s lr=0.0000257 time=162.22 INFO:root:[step 743249] mlm_loss=1.42368 mlm_acc=67.54206 nsp_loss=0.03455 nsp_acc=98.800 throughput=133.0K tks/s lr=0.0000257 time=114.14 INFO:root:[step 743499] mlm_loss=1.72101 mlm_acc=64.23148 nsp_loss=0.03406 nsp_acc=98.701 throughput=154.0K tks/s lr=0.0000257 time=153.09 INFO:root:[step 743749] mlm_loss=1.44830 mlm_acc=67.87541 nsp_loss=0.03158 nsp_acc=98.862 throughput=120.0K tks/s lr=0.0000256 time=124.99 INFO:root:[step 743999] mlm_loss=1.46275 mlm_acc=67.13430 nsp_loss=0.02565 nsp_acc=99.093 throughput=130.0K tks/s lr=0.0000256 time=127.79 INFO:root:[step 744249] mlm_loss=1.53094 mlm_acc=67.13214 nsp_loss=0.02686 nsp_acc=99.063 throughput=137.0K tks/s lr=0.0000256 time=117.52 INFO:root:[step 744499] mlm_loss=1.37282 mlm_acc=68.61614 nsp_loss=0.03526 nsp_acc=98.836 throughput=114.0K tks/s lr=0.0000256 time=119.01 INFO:root:[step 744749] mlm_loss=1.42882 mlm_acc=68.17318 nsp_loss=0.03311 nsp_acc=98.778 throughput=128.0K tks/s lr=0.0000255 time=112.64 INFO:root:[step 744999] mlm_loss=1.48477 mlm_acc=66.93934 nsp_loss=0.06230 nsp_acc=97.509 throughput=141.0K tks/s lr=0.0000255 time=139.84 INFO:root:[step 744999] Saving checkpoints to /home/ubuntu/ckpt-master/0744999.params, /home/ubuntu/ckpt-master/0744999.states. INFO:root:[step 745249] mlm_loss=1.57014 mlm_acc=66.05772 nsp_loss=0.04816 nsp_acc=98.145 throughput=134.0K tks/s lr=0.0000255 time=160.14 INFO:root:[step 745499] mlm_loss=1.64994 mlm_acc=64.75478 nsp_loss=0.06084 nsp_acc=97.524 throughput=150.0K tks/s lr=0.0000255 time=145.76 INFO:root:[step 745749] mlm_loss=1.64355 mlm_acc=65.51504 nsp_loss=0.03219 nsp_acc=98.755 throughput=145.0K tks/s lr=0.0000254 time=146.03 INFO:root:[step 745999] mlm_loss=1.54883 mlm_acc=66.42564 nsp_loss=0.02662 nsp_acc=99.051 throughput=133.0K tks/s lr=0.0000254 time=130.22 INFO:root:[step 746249] mlm_loss=1.56225 mlm_acc=66.70297 nsp_loss=0.02482 nsp_acc=99.120 throughput=139.0K tks/s lr=0.0000254 time=132.77 INFO:root:[step 746499] mlm_loss=1.71166 mlm_acc=63.44360 nsp_loss=0.03354 nsp_acc=98.803 throughput=143.0K tks/s lr=0.0000254 time=144.95 INFO:root:[step 746749] mlm_loss=1.41029 mlm_acc=68.42642 nsp_loss=0.03076 nsp_acc=98.939 throughput=123.0K tks/s lr=0.0000253 time=112.01 INFO:root:[step 746999] mlm_loss=1.64286 mlm_acc=64.31552 nsp_loss=0.03146 nsp_acc=98.814 throughput=143.0K tks/s lr=0.0000253 time=142.17 INFO:root:[step 747249] mlm_loss=1.37604 mlm_acc=68.34412 nsp_loss=0.04430 nsp_acc=98.377 throughput=117.0K tks/s lr=0.0000253 time=117.23 INFO:root:[step 747499] mlm_loss=1.59296 mlm_acc=66.09332 nsp_loss=0.04988 nsp_acc=98.053 throughput=143.0K tks/s lr=0.0000253 time=144.39 INFO:root:[step 747749] mlm_loss=1.60178 mlm_acc=66.55528 nsp_loss=0.02409 nsp_acc=99.165 throughput=138.0K tks/s lr=0.0000252 time=133.06 INFO:root:[step 747999] mlm_loss=1.58953 mlm_acc=66.68199 nsp_loss=0.02301 nsp_acc=99.175 throughput=146.0K tks/s lr=0.0000252 time=125.82 INFO:root:[step 748249] mlm_loss=1.55331 mlm_acc=66.09088 nsp_loss=0.03562 nsp_acc=98.664 throughput=143.0K tks/s lr=0.0000252 time=141.94 INFO:root:[step 748499] mlm_loss=1.53474 mlm_acc=66.90763 nsp_loss=0.02746 nsp_acc=99.016 throughput=133.0K tks/s lr=0.0000252 time=131.39 INFO:root:[step 748749] mlm_loss=1.66598 mlm_acc=64.83821 nsp_loss=0.03874 nsp_acc=98.458 throughput=154.0K tks/s lr=0.0000251 time=154.30 INFO:root:[step 748999] mlm_loss=1.49265 mlm_acc=67.50752 nsp_loss=0.02862 nsp_acc=98.981 throughput=127.0K tks/s lr=0.0000251 time=128.05 INFO:root:[step 749249] mlm_loss=1.40997 mlm_acc=68.23572 nsp_loss=0.02859 nsp_acc=99.003 throughput=118.0K tks/s lr=0.0000251 time=118.10 INFO:root:[step 749499] mlm_loss=1.55342 mlm_acc=66.74460 nsp_loss=0.02888 nsp_acc=98.969 throughput=137.0K tks/s lr=0.0000251 time=124.31 INFO:root:[step 749749] mlm_loss=1.55333 mlm_acc=66.23216 nsp_loss=0.04146 nsp_acc=98.477 throughput=136.0K tks/s lr=0.0000250 time=131.26 INFO:root:[step 749999] mlm_loss=1.48174 mlm_acc=66.49533 nsp_loss=0.04175 nsp_acc=98.444 throughput=127.0K tks/s lr=0.0000250 time=132.24 INFO:root:[step 749999] Saving checkpoints to /home/ubuntu/ckpt-master/0749999.params, /home/ubuntu/ckpt-master/0749999.states. INFO:root:[step 750249] mlm_loss=1.54578 mlm_acc=65.43475 nsp_loss=0.03269 nsp_acc=98.825 throughput=129.0K tks/s lr=0.0000250 time=149.86 INFO:root:[step 750499] mlm_loss=1.67659 mlm_acc=64.42255 nsp_loss=0.03623 nsp_acc=98.608 throughput=148.0K tks/s lr=0.0000250 time=153.67 INFO:root:[step 750749] mlm_loss=1.43532 mlm_acc=68.26443 nsp_loss=0.03147 nsp_acc=98.897 throughput=124.0K tks/s lr=0.0000249 time=109.52 INFO:root:[step 750999] mlm_loss=1.61186 mlm_acc=64.78465 nsp_loss=0.03341 nsp_acc=98.779 throughput=140.0K tks/s lr=0.0000249 time=138.25 INFO:root:[step 751249] mlm_loss=1.71222 mlm_acc=63.44018 nsp_loss=0.05446 nsp_acc=97.814 throughput=147.0K tks/s lr=0.0000249 time=143.15 INFO:root:[step 751499] mlm_loss=1.46217 mlm_acc=67.34597 nsp_loss=0.03541 nsp_acc=98.682 throughput=128.0K tks/s lr=0.0000249 time=127.33 INFO:root:[step 751749] mlm_loss=1.58521 mlm_acc=66.73592 nsp_loss=0.02379 nsp_acc=99.171 throughput=138.0K tks/s lr=0.0000248 time=133.21 INFO:root:[step 751999] mlm_loss=1.52872 mlm_acc=67.25970 nsp_loss=0.02627 nsp_acc=99.086 throughput=138.0K tks/s lr=0.0000248 time=122.28 INFO:root:[step 752249] mlm_loss=1.50978 mlm_acc=66.37267 nsp_loss=0.03658 nsp_acc=98.609 throughput=130.0K tks/s lr=0.0000248 time=127.25 INFO:root:[step 752499] mlm_loss=1.59339 mlm_acc=65.59783 nsp_loss=0.04189 nsp_acc=98.407 throughput=134.0K tks/s lr=0.0000248 time=136.44 INFO:root:[step 752749] mlm_loss=1.40739 mlm_acc=68.29282 nsp_loss=0.03041 nsp_acc=98.963 throughput=125.0K tks/s lr=0.0000247 time=112.26 INFO:root:[step 752999] mlm_loss=1.51422 mlm_acc=66.46458 nsp_loss=0.02785 nsp_acc=99.019 throughput=133.0K tks/s lr=0.0000247 time=131.01 INFO:root:[step 753249] mlm_loss=1.26780 mlm_acc=69.65234 nsp_loss=0.03893 nsp_acc=98.610 throughput=109.0K tks/s lr=0.0000247 time=106.70 INFO:root:[step 753499] mlm_loss=1.39351 mlm_acc=66.70322 nsp_loss=0.04798 nsp_acc=98.257 throughput=133.0K tks/s lr=0.0000247 time=134.75 INFO:root:[step 753749] mlm_loss=1.42939 mlm_acc=67.99354 nsp_loss=0.03074 nsp_acc=98.953 throughput=125.0K tks/s lr=0.0000246 time=110.98 INFO:root:[step 753999] mlm_loss=1.24910 mlm_acc=72.99435 nsp_loss=0.04133 nsp_acc=98.588 throughput=145.0K tks/s lr=0.0000246 time=138.94 INFO:root:[step 754249] mlm_loss=1.44970 mlm_acc=67.52614 nsp_loss=0.03417 nsp_acc=98.776 throughput=117.0K tks/s lr=0.0000246 time=125.35 INFO:root:[step 754499] mlm_loss=1.39751 mlm_acc=68.62338 nsp_loss=0.03416 nsp_acc=98.772 throughput=119.0K tks/s lr=0.0000246 time=107.58 INFO:root:[step 754749] mlm_loss=1.36625 mlm_acc=68.63797 nsp_loss=0.03468 nsp_acc=98.753 throughput=115.0K tks/s lr=0.0000245 time=106.30 INFO:root:[step 754999] mlm_loss=1.28339 mlm_acc=69.12950 nsp_loss=0.03929 nsp_acc=98.576 throughput=116.0K tks/s lr=0.0000245 time=108.23 INFO:root:[step 754999] Saving checkpoints to /home/ubuntu/ckpt-master/0754999.params, /home/ubuntu/ckpt-master/0754999.states. INFO:root:[step 755249] mlm_loss=1.42010 mlm_acc=67.49408 nsp_loss=0.03607 nsp_acc=98.690 throughput=109.0K tks/s lr=0.0000245 time=135.14 INFO:root:[step 755499] mlm_loss=1.49306 mlm_acc=66.21932 nsp_loss=0.04457 nsp_acc=98.334 throughput=137.0K tks/s lr=0.0000245 time=126.70 INFO:root:[step 755749] mlm_loss=1.44203 mlm_acc=67.96453 nsp_loss=0.02974 nsp_acc=98.916 throughput=118.0K tks/s lr=0.0000244 time=117.21 INFO:root:[step 755999] mlm_loss=1.47748 mlm_acc=67.26595 nsp_loss=0.02822 nsp_acc=99.010 throughput=133.0K tks/s lr=0.0000244 time=117.44 INFO:root:[step 756249] mlm_loss=1.46602 mlm_acc=67.66957 nsp_loss=0.02785 nsp_acc=99.054 throughput=124.0K tks/s lr=0.0000244 time=124.43 INFO:root:[step 756499] mlm_loss=1.44205 mlm_acc=67.74998 nsp_loss=0.03017 nsp_acc=98.897 throughput=130.0K tks/s lr=0.0000244 time=119.51 INFO:root:[step 756749] mlm_loss=1.42397 mlm_acc=67.87118 nsp_loss=0.05468 nsp_acc=97.825 throughput=120.0K tks/s lr=0.0000243 time=123.43 INFO:root:[step 756999] mlm_loss=1.59962 mlm_acc=66.13142 nsp_loss=0.05291 nsp_acc=97.856 throughput=138.0K tks/s lr=0.0000243 time=137.32 INFO:root:[step 757249] mlm_loss=1.49087 mlm_acc=67.69008 nsp_loss=0.02673 nsp_acc=99.061 throughput=129.0K tks/s lr=0.0000243 time=114.13 INFO:root:[step 757499] mlm_loss=1.63188 mlm_acc=65.32941 nsp_loss=0.05809 nsp_acc=97.681 throughput=151.0K tks/s lr=0.0000243 time=148.00 INFO:root:[step 757749] mlm_loss=1.56246 mlm_acc=65.96398 nsp_loss=0.04114 nsp_acc=98.427 throughput=135.0K tks/s lr=0.0000242 time=132.75 INFO:root:[step 757999] mlm_loss=1.54731 mlm_acc=66.46262 nsp_loss=0.02879 nsp_acc=98.991 throughput=135.0K tks/s lr=0.0000242 time=134.69 INFO:root:[step 758249] mlm_loss=1.57259 mlm_acc=65.56092 nsp_loss=0.04243 nsp_acc=98.350 throughput=135.0K tks/s lr=0.0000242 time=135.96 INFO:root:[step 758499] mlm_loss=1.52807 mlm_acc=65.65348 nsp_loss=0.04790 nsp_acc=98.184 throughput=143.0K tks/s lr=0.0000242 time=122.73 INFO:root:[step 758749] mlm_loss=1.41795 mlm_acc=67.95130 nsp_loss=0.02936 nsp_acc=98.978 throughput=122.0K tks/s lr=0.0000241 time=122.49 INFO:root:[step 758999] mlm_loss=1.75247 mlm_acc=63.87164 nsp_loss=0.06602 nsp_acc=97.359 throughput=149.0K tks/s lr=0.0000241 time=148.68 INFO:root:[step 759249] mlm_loss=1.53856 mlm_acc=66.36446 nsp_loss=0.03959 nsp_acc=98.558 throughput=125.0K tks/s lr=0.0000241 time=123.10 INFO:root:[step 759499] mlm_loss=1.63669 mlm_acc=65.87459 nsp_loss=0.02186 nsp_acc=99.239 throughput=143.0K tks/s lr=0.0000241 time=141.17 INFO:root:[step 759749] mlm_loss=1.79032 mlm_acc=63.77875 nsp_loss=0.04969 nsp_acc=98.062 throughput=150.0K tks/s lr=0.0000240 time=145.74 INFO:root:[step 759999] mlm_loss=1.63331 mlm_acc=65.43790 nsp_loss=0.03353 nsp_acc=98.771 throughput=140.0K tks/s lr=0.0000240 time=137.00 INFO:root:[step 759999] Saving checkpoints to /home/ubuntu/ckpt-master/0759999.params, /home/ubuntu/ckpt-master/0759999.states. INFO:root:[step 760249] mlm_loss=1.51614 mlm_acc=67.73652 nsp_loss=0.02729 nsp_acc=99.067 throughput=122.0K tks/s lr=0.0000240 time=135.53 INFO:root:[step 760499] mlm_loss=1.55223 mlm_acc=65.88466 nsp_loss=0.05113 nsp_acc=98.023 throughput=126.0K tks/s lr=0.0000240 time=127.01 INFO:root:[step 760749] mlm_loss=1.46031 mlm_acc=66.42200 nsp_loss=0.04605 nsp_acc=98.232 throughput=125.0K tks/s lr=0.0000239 time=115.76 INFO:root:[step 760999] mlm_loss=1.38048 mlm_acc=68.19165 nsp_loss=0.04066 nsp_acc=98.494 throughput=121.0K tks/s lr=0.0000239 time=123.02 INFO:root:[step 761249] mlm_loss=1.73152 mlm_acc=63.75477 nsp_loss=0.07850 nsp_acc=96.839 throughput=153.0K tks/s lr=0.0000239 time=156.93 INFO:root:[step 761499] mlm_loss=1.64174 mlm_acc=65.71004 nsp_loss=0.03673 nsp_acc=98.571 throughput=144.0K tks/s lr=0.0000239 time=140.29 INFO:root:[step 761749] mlm_loss=1.52139 mlm_acc=66.49001 nsp_loss=0.02991 nsp_acc=98.876 throughput=135.0K tks/s lr=0.0000238 time=135.54 INFO:root:[step 761999] mlm_loss=1.43794 mlm_acc=66.78442 nsp_loss=0.03638 nsp_acc=98.709 throughput=122.0K tks/s lr=0.0000238 time=130.32 INFO:root:[step 762249] mlm_loss=1.41685 mlm_acc=66.66029 nsp_loss=0.04501 nsp_acc=98.372 throughput=135.0K tks/s lr=0.0000238 time=113.88 INFO:root:[step 762499] mlm_loss=1.39110 mlm_acc=66.63835 nsp_loss=0.05532 nsp_acc=97.849 throughput=125.0K tks/s lr=0.0000238 time=117.55 INFO:root:[step 762749] mlm_loss=1.66115 mlm_acc=64.22263 nsp_loss=0.02807 nsp_acc=98.984 throughput=141.0K tks/s lr=0.0000237 time=153.42 INFO:root:[step 762999] mlm_loss=1.51244 mlm_acc=67.35081 nsp_loss=0.02957 nsp_acc=98.938 throughput=134.0K tks/s lr=0.0000237 time=117.61 INFO:root:[step 763249] mlm_loss=1.56163 mlm_acc=66.21397 nsp_loss=0.05069 nsp_acc=98.077 throughput=149.0K tks/s lr=0.0000237 time=147.89 INFO:root:[step 763499] mlm_loss=1.46823 mlm_acc=67.69336 nsp_loss=0.02907 nsp_acc=98.978 throughput=122.0K tks/s lr=0.0000237 time=123.93 INFO:root:[step 763749] mlm_loss=1.45947 mlm_acc=67.80497 nsp_loss=0.02818 nsp_acc=99.034 throughput=131.0K tks/s lr=0.0000236 time=114.27 INFO:root:[step 763999] mlm_loss=1.45414 mlm_acc=67.84500 nsp_loss=0.03023 nsp_acc=98.942 throughput=116.0K tks/s lr=0.0000236 time=120.30 INFO:root:[step 764249] mlm_loss=1.56197 mlm_acc=65.75980 nsp_loss=0.02963 nsp_acc=98.956 throughput=146.0K tks/s lr=0.0000236 time=140.91 INFO:root:[step 764499] mlm_loss=1.56436 mlm_acc=66.40367 nsp_loss=0.03171 nsp_acc=98.820 throughput=141.0K tks/s lr=0.0000236 time=141.35 INFO:root:[step 764749] mlm_loss=1.60994 mlm_acc=66.35337 nsp_loss=0.02336 nsp_acc=99.155 throughput=140.0K tks/s lr=0.0000235 time=136.60 INFO:root:[step 764999] mlm_loss=1.59530 mlm_acc=66.72454 nsp_loss=0.02340 nsp_acc=99.157 throughput=136.0K tks/s lr=0.0000235 time=132.69 INFO:root:[step 764999] Saving checkpoints to /home/ubuntu/ckpt-master/0764999.params, /home/ubuntu/ckpt-master/0764999.states. INFO:root:[step 765249] mlm_loss=1.58026 mlm_acc=66.78804 nsp_loss=0.02275 nsp_acc=99.197 throughput=130.0K tks/s lr=0.0000235 time=140.24 INFO:root:[step 765499] mlm_loss=1.63457 mlm_acc=65.86909 nsp_loss=0.02064 nsp_acc=99.265 throughput=140.0K tks/s lr=0.0000235 time=145.09 INFO:root:[step 765749] mlm_loss=1.68015 mlm_acc=63.44962 nsp_loss=0.02828 nsp_acc=98.917 throughput=149.0K tks/s lr=0.0000234 time=155.03 INFO:root:[step 765999] mlm_loss=1.32903 mlm_acc=69.00515 nsp_loss=0.02610 nsp_acc=99.136 throughput=124.0K tks/s lr=0.0000234 time=111.18 INFO:root:[step 766249] mlm_loss=1.42515 mlm_acc=66.58758 nsp_loss=0.07178 nsp_acc=97.022 throughput=128.0K tks/s lr=0.0000234 time=130.73 INFO:root:[step 766499] mlm_loss=1.35436 mlm_acc=68.55375 nsp_loss=0.02644 nsp_acc=99.072 throughput=130.0K tks/s lr=0.0000234 time=111.51 INFO:root:[step 766749] mlm_loss=1.49783 mlm_acc=67.33488 nsp_loss=0.02097 nsp_acc=99.282 throughput=130.0K tks/s lr=0.0000233 time=130.53 INFO:root:[step 766999] mlm_loss=1.43632 mlm_acc=68.16121 nsp_loss=0.02197 nsp_acc=99.261 throughput=134.0K tks/s lr=0.0000233 time=112.91 INFO:root:[step 767249] mlm_loss=1.53203 mlm_acc=66.58197 nsp_loss=0.03222 nsp_acc=98.817 throughput=142.0K tks/s lr=0.0000233 time=140.81 INFO:root:[step 767499] mlm_loss=1.20326 mlm_acc=69.61308 nsp_loss=0.04424 nsp_acc=98.429 throughput=112.0K tks/s lr=0.0000233 time=117.21 INFO:root:[step 767749] mlm_loss=1.55140 mlm_acc=66.15222 nsp_loss=0.02372 nsp_acc=99.181 throughput=142.0K tks/s lr=0.0000232 time=137.12 INFO:root:[step 767999] mlm_loss=1.60887 mlm_acc=65.77595 nsp_loss=0.02656 nsp_acc=99.033 throughput=151.0K tks/s lr=0.0000232 time=152.89 INFO:root:[step 768249] mlm_loss=1.63351 mlm_acc=65.52950 nsp_loss=0.04338 nsp_acc=98.358 throughput=145.0K tks/s lr=0.0000232 time=144.58 INFO:root:[step 768499] mlm_loss=1.61434 mlm_acc=65.76654 nsp_loss=0.02339 nsp_acc=99.141 throughput=147.0K tks/s lr=0.0000232 time=139.77 INFO:root:[step 768749] mlm_loss=1.38114 mlm_acc=67.51727 nsp_loss=0.03217 nsp_acc=98.866 throughput=129.0K tks/s lr=0.0000231 time=116.71 INFO:root:[step 768999] mlm_loss=1.47740 mlm_acc=67.32184 nsp_loss=0.02313 nsp_acc=99.196 throughput=130.0K tks/s lr=0.0000231 time=127.90 INFO:root:[step 769249] mlm_loss=1.49647 mlm_acc=65.74208 nsp_loss=0.04251 nsp_acc=98.382 throughput=135.0K tks/s lr=0.0000231 time=137.21 INFO:root:[step 769499] mlm_loss=1.38978 mlm_acc=68.52833 nsp_loss=0.02561 nsp_acc=99.096 throughput=122.0K tks/s lr=0.0000231 time=113.05 INFO:root:[step 769749] mlm_loss=1.38962 mlm_acc=67.66683 nsp_loss=0.02867 nsp_acc=98.990 throughput=121.0K tks/s lr=0.0000230 time=119.65 INFO:root:[step 769999] mlm_loss=1.59610 mlm_acc=65.04616 nsp_loss=0.02302 nsp_acc=99.159 throughput=142.0K tks/s lr=0.0000230 time=147.18 INFO:root:[step 769999] Saving checkpoints to /home/ubuntu/ckpt-master/0769999.params, /home/ubuntu/ckpt-master/0769999.states. INFO:root:[step 770249] mlm_loss=1.39240 mlm_acc=68.42520 nsp_loss=0.02886 nsp_acc=98.986 throughput=111.0K tks/s lr=0.0000230 time=125.52 INFO:root:[step 770499] mlm_loss=1.45117 mlm_acc=67.47601 nsp_loss=0.02607 nsp_acc=99.054 throughput=127.0K tks/s lr=0.0000230 time=128.25 INFO:root:[step 770749] mlm_loss=1.37394 mlm_acc=68.40918 nsp_loss=0.02922 nsp_acc=98.958 throughput=125.0K tks/s lr=0.0000229 time=110.71 INFO:root:[step 770999] mlm_loss=1.65016 mlm_acc=64.84290 nsp_loss=0.02706 nsp_acc=98.981 throughput=143.0K tks/s lr=0.0000229 time=140.37 INFO:root:[step 771249] mlm_loss=1.70897 mlm_acc=64.68629 nsp_loss=0.03088 nsp_acc=98.819 throughput=145.0K tks/s lr=0.0000229 time=145.74 INFO:root:[step 771499] mlm_loss=1.45956 mlm_acc=66.76155 nsp_loss=0.03628 nsp_acc=98.666 throughput=131.0K tks/s lr=0.0000229 time=130.15 INFO:root:[step 771749] mlm_loss=1.66380 mlm_acc=65.05839 nsp_loss=0.08239 nsp_acc=96.458 throughput=144.0K tks/s lr=0.0000228 time=143.10 INFO:root:[step 771999] mlm_loss=1.40764 mlm_acc=68.30979 nsp_loss=0.02817 nsp_acc=99.022 throughput=125.0K tks/s lr=0.0000228 time=121.72 INFO:root:[step 772249] mlm_loss=1.14718 mlm_acc=75.17179 nsp_loss=0.03177 nsp_acc=98.985 throughput=146.0K tks/s lr=0.0000228 time=129.93 INFO:root:[step 772499] mlm_loss=1.51345 mlm_acc=67.44196 nsp_loss=0.02148 nsp_acc=99.240 throughput=128.0K tks/s lr=0.0000228 time=127.51 INFO:root:[step 772749] mlm_loss=1.51265 mlm_acc=67.32117 nsp_loss=0.02046 nsp_acc=99.299 throughput=130.0K tks/s lr=0.0000227 time=126.63 INFO:root:[step 772999] mlm_loss=1.65705 mlm_acc=64.56463 nsp_loss=0.02702 nsp_acc=99.044 throughput=150.0K tks/s lr=0.0000227 time=149.54 INFO:root:[step 773249] mlm_loss=1.48144 mlm_acc=67.62847 nsp_loss=0.02416 nsp_acc=99.171 throughput=133.0K tks/s lr=0.0000227 time=115.85 INFO:root:[step 773499] mlm_loss=1.58332 mlm_acc=66.42826 nsp_loss=0.01911 nsp_acc=99.348 throughput=144.0K tks/s lr=0.0000227 time=139.42 INFO:root:[step 773749] mlm_loss=1.39730 mlm_acc=67.66547 nsp_loss=0.02943 nsp_acc=98.927 throughput=119.0K tks/s lr=0.0000226 time=119.55 INFO:root:[step 773999] mlm_loss=1.55786 mlm_acc=65.54719 nsp_loss=0.03185 nsp_acc=98.808 throughput=134.0K tks/s lr=0.0000226 time=133.22 INFO:root:[step 774249] mlm_loss=1.50898 mlm_acc=66.06820 nsp_loss=0.06644 nsp_acc=97.312 throughput=133.0K tks/s lr=0.0000226 time=124.88 INFO:root:[step 774499] mlm_loss=1.55637 mlm_acc=65.56620 nsp_loss=0.05728 nsp_acc=97.770 throughput=143.0K tks/s lr=0.0000226 time=141.02 INFO:root:[step 774749] mlm_loss=1.61539 mlm_acc=64.01245 nsp_loss=0.03768 nsp_acc=98.651 throughput=146.0K tks/s lr=0.0000225 time=148.86 INFO:root:[step 774999] mlm_loss=1.30533 mlm_acc=69.11811 nsp_loss=0.03204 nsp_acc=98.881 throughput=117.0K tks/s lr=0.0000225 time=107.21 INFO:root:[step 774999] Saving checkpoints to /home/ubuntu/ckpt-master/0774999.params, /home/ubuntu/ckpt-master/0774999.states. INFO:root:[step 775249] mlm_loss=1.29212 mlm_acc=68.80955 nsp_loss=0.03338 nsp_acc=98.833 throughput=98.0K tks/s lr=0.0000225 time=134.57 INFO:root:[step 775499] mlm_loss=1.32812 mlm_acc=69.28893 nsp_loss=0.03742 nsp_acc=98.719 throughput=122.0K tks/s lr=0.0000225 time=109.95 INFO:root:[step 775749] mlm_loss=1.42411 mlm_acc=67.76601 nsp_loss=0.03003 nsp_acc=98.930 throughput=130.0K tks/s lr=0.0000224 time=131.50 INFO:root:[step 775999] mlm_loss=1.31853 mlm_acc=69.23196 nsp_loss=0.02954 nsp_acc=98.966 throughput=119.0K tks/s lr=0.0000224 time=109.76 INFO:root:[step 776249] mlm_loss=1.48231 mlm_acc=66.18411 nsp_loss=0.07040 nsp_acc=97.197 throughput=145.0K tks/s lr=0.0000224 time=142.52 INFO:root:[step 776499] mlm_loss=1.38761 mlm_acc=67.66251 nsp_loss=0.03987 nsp_acc=98.492 throughput=127.0K tks/s lr=0.0000224 time=127.97 INFO:root:[step 776749] mlm_loss=1.42892 mlm_acc=68.33661 nsp_loss=0.02727 nsp_acc=99.070 throughput=130.0K tks/s lr=0.0000223 time=116.14 INFO:root:[step 776999] mlm_loss=1.51045 mlm_acc=67.27825 nsp_loss=0.04113 nsp_acc=98.516 throughput=139.0K tks/s lr=0.0000223 time=135.71 INFO:root:[step 777249] mlm_loss=1.46856 mlm_acc=68.41852 nsp_loss=0.03951 nsp_acc=98.565 throughput=146.0K tks/s lr=0.0000223 time=146.30 INFO:root:[step 777499] mlm_loss=1.51884 mlm_acc=67.24541 nsp_loss=0.02206 nsp_acc=99.250 throughput=129.0K tks/s lr=0.0000223 time=127.54 INFO:root:[step 777749] mlm_loss=1.39047 mlm_acc=68.24227 nsp_loss=0.03098 nsp_acc=98.878 throughput=125.0K tks/s lr=0.0000222 time=111.86 INFO:root:[step 777999] mlm_loss=1.49248 mlm_acc=66.76408 nsp_loss=0.02401 nsp_acc=99.154 throughput=133.0K tks/s lr=0.0000222 time=133.54 INFO:root:[step 778249] mlm_loss=1.36041 mlm_acc=68.75345 nsp_loss=0.02901 nsp_acc=98.977 throughput=123.0K tks/s lr=0.0000222 time=111.81 INFO:root:[step 778499] mlm_loss=1.36314 mlm_acc=68.86525 nsp_loss=0.02674 nsp_acc=99.059 throughput=119.0K tks/s lr=0.0000222 time=109.52 INFO:root:[step 778749] mlm_loss=1.63171 mlm_acc=65.06724 nsp_loss=0.03082 nsp_acc=98.805 throughput=148.0K tks/s lr=0.0000221 time=159.73 INFO:root:[step 778999] mlm_loss=1.68789 mlm_acc=64.18940 nsp_loss=0.02274 nsp_acc=99.163 throughput=155.0K tks/s lr=0.0000221 time=157.80 INFO:root:[step 779249] mlm_loss=1.77322 mlm_acc=63.53855 nsp_loss=0.03486 nsp_acc=98.654 throughput=145.0K tks/s lr=0.0000221 time=144.40 INFO:root:[step 779499] mlm_loss=1.38086 mlm_acc=68.24112 nsp_loss=0.02719 nsp_acc=99.049 throughput=123.0K tks/s lr=0.0000221 time=121.32 INFO:root:[step 779749] mlm_loss=1.43859 mlm_acc=67.95768 nsp_loss=0.02296 nsp_acc=99.200 throughput=125.0K tks/s lr=0.0000220 time=124.36 INFO:root:[step 779999] mlm_loss=1.73004 mlm_acc=63.87583 nsp_loss=0.03323 nsp_acc=98.763 throughput=148.0K tks/s lr=0.0000220 time=145.96 INFO:root:[step 779999] Saving checkpoints to /home/ubuntu/ckpt-master/0779999.params, /home/ubuntu/ckpt-master/0779999.states. INFO:root:[step 780249] mlm_loss=1.80512 mlm_acc=63.42902 nsp_loss=0.03337 nsp_acc=98.692 throughput=133.0K tks/s lr=0.0000220 time=157.75 INFO:root:[step 780499] mlm_loss=1.42213 mlm_acc=67.90492 nsp_loss=0.02633 nsp_acc=99.043 throughput=131.0K tks/s lr=0.0000220 time=120.73 INFO:root:[step 780749] mlm_loss=1.56449 mlm_acc=65.55813 nsp_loss=0.12023 nsp_acc=94.890 throughput=137.0K tks/s lr=0.0000219 time=138.84 INFO:root:[step 780999] mlm_loss=1.50445 mlm_acc=66.64279 nsp_loss=0.03693 nsp_acc=98.585 throughput=130.0K tks/s lr=0.0000219 time=137.13 INFO:root:[step 781249] mlm_loss=1.42225 mlm_acc=67.65866 nsp_loss=0.02573 nsp_acc=99.121 throughput=125.0K tks/s lr=0.0000219 time=125.68 INFO:root:[step 781499] mlm_loss=1.50416 mlm_acc=67.15465 nsp_loss=0.02569 nsp_acc=99.136 throughput=139.0K tks/s lr=0.0000219 time=120.75 INFO:root:[step 781749] mlm_loss=1.49266 mlm_acc=67.40728 nsp_loss=0.02236 nsp_acc=99.259 throughput=133.0K tks/s lr=0.0000218 time=130.14 INFO:root:[step 781999] mlm_loss=1.55040 mlm_acc=65.99714 nsp_loss=0.03206 nsp_acc=98.786 throughput=148.0K tks/s lr=0.0000218 time=147.73 INFO:root:[step 782249] mlm_loss=1.36330 mlm_acc=68.85517 nsp_loss=0.03096 nsp_acc=98.906 throughput=118.0K tks/s lr=0.0000218 time=111.51 INFO:root:[step 782499] mlm_loss=1.49013 mlm_acc=65.81096 nsp_loss=0.03916 nsp_acc=98.558 throughput=133.0K tks/s lr=0.0000218 time=136.50 INFO:root:[step 782749] mlm_loss=1.03214 mlm_acc=77.01738 nsp_loss=0.04077 nsp_acc=98.633 throughput=142.0K tks/s lr=0.0000217 time=140.53 INFO:root:[step 782999] mlm_loss=1.42283 mlm_acc=70.08606 nsp_loss=0.02534 nsp_acc=99.133 throughput=144.0K tks/s lr=0.0000217 time=142.58 INFO:root:[step 783249] mlm_loss=1.48202 mlm_acc=67.43723 nsp_loss=0.02452 nsp_acc=99.141 throughput=123.0K tks/s lr=0.0000217 time=127.72 INFO:root:[step 783499] mlm_loss=1.38826 mlm_acc=68.56660 nsp_loss=0.02703 nsp_acc=99.089 throughput=125.0K tks/s lr=0.0000217 time=111.75 INFO:root:[step 783749] mlm_loss=1.49808 mlm_acc=67.57832 nsp_loss=0.02318 nsp_acc=99.185 throughput=128.0K tks/s lr=0.0000216 time=126.30 INFO:root:[step 783999] mlm_loss=1.59620 mlm_acc=66.41750 nsp_loss=0.01756 nsp_acc=99.381 throughput=136.0K tks/s lr=0.0000216 time=140.27 INFO:root:[step 784249] mlm_loss=1.36791 mlm_acc=68.53485 nsp_loss=0.03234 nsp_acc=98.859 throughput=118.0K tks/s lr=0.0000216 time=108.61 INFO:root:[step 784499] mlm_loss=1.37133 mlm_acc=68.79810 nsp_loss=0.03063 nsp_acc=98.950 throughput=123.0K tks/s lr=0.0000216 time=108.30 INFO:root:[step 784749] mlm_loss=1.50566 mlm_acc=67.29184 nsp_loss=0.02137 nsp_acc=99.277 throughput=133.0K tks/s lr=0.0000215 time=133.31 INFO:root:[step 784999] mlm_loss=1.51675 mlm_acc=66.61851 nsp_loss=0.06790 nsp_acc=97.187 throughput=130.0K tks/s lr=0.0000215 time=129.33 INFO:root:[step 784999] Saving checkpoints to /home/ubuntu/ckpt-master/0784999.params, /home/ubuntu/ckpt-master/0784999.states. INFO:root:[step 785249] mlm_loss=1.60637 mlm_acc=65.70524 nsp_loss=0.02906 nsp_acc=98.965 throughput=135.0K tks/s lr=0.0000215 time=164.50 INFO:root:[step 785499] mlm_loss=1.52128 mlm_acc=67.44094 nsp_loss=0.01980 nsp_acc=99.302 throughput=141.0K tks/s lr=0.0000215 time=122.12 INFO:root:[step 785749] mlm_loss=1.79745 mlm_acc=62.51279 nsp_loss=0.04832 nsp_acc=98.048 throughput=153.0K tks/s lr=0.0000214 time=168.94 INFO:root:[step 785999] mlm_loss=1.62502 mlm_acc=66.07685 nsp_loss=0.01696 nsp_acc=99.405 throughput=146.0K tks/s lr=0.0000214 time=143.27 INFO:root:[step 786249] mlm_loss=1.43539 mlm_acc=66.91212 nsp_loss=0.03109 nsp_acc=98.888 throughput=136.0K tks/s lr=0.0000214 time=137.45 INFO:root:[step 786499] mlm_loss=1.35095 mlm_acc=69.14422 nsp_loss=0.03307 nsp_acc=98.790 throughput=120.0K tks/s lr=0.0000214 time=118.98 INFO:root:[step 786749] mlm_loss=1.40724 mlm_acc=68.29214 nsp_loss=0.02677 nsp_acc=99.049 throughput=127.0K tks/s lr=0.0000213 time=110.93 INFO:root:[step 786999] mlm_loss=1.42730 mlm_acc=68.44719 nsp_loss=0.02468 nsp_acc=99.116 throughput=132.0K tks/s lr=0.0000213 time=114.42 INFO:root:[step 787249] mlm_loss=1.63665 mlm_acc=65.86522 nsp_loss=0.01764 nsp_acc=99.371 throughput=142.0K tks/s lr=0.0000213 time=151.53 INFO:root:[step 787499] mlm_loss=1.69741 mlm_acc=63.22755 nsp_loss=0.04072 nsp_acc=98.482 throughput=149.0K tks/s lr=0.0000213 time=156.82 INFO:root:[step 787749] mlm_loss=1.50888 mlm_acc=65.71803 nsp_loss=0.03185 nsp_acc=98.865 throughput=142.0K tks/s lr=0.0000212 time=139.48 INFO:root:[step 787999] mlm_loss=1.57616 mlm_acc=66.92978 nsp_loss=0.01940 nsp_acc=99.341 throughput=136.0K tks/s lr=0.0000212 time=136.28 INFO:root:[step 788249] mlm_loss=1.46384 mlm_acc=67.86415 nsp_loss=0.02560 nsp_acc=99.125 throughput=135.0K tks/s lr=0.0000212 time=115.66 INFO:root:[step 788499] mlm_loss=1.62992 mlm_acc=65.73629 nsp_loss=0.02133 nsp_acc=99.257 throughput=153.0K tks/s lr=0.0000212 time=151.95 INFO:root:[step 788749] mlm_loss=1.47042 mlm_acc=66.48611 nsp_loss=0.03960 nsp_acc=98.546 throughput=137.0K tks/s lr=0.0000211 time=137.19 INFO:root:[step 788999] mlm_loss=1.48035 mlm_acc=67.38036 nsp_loss=0.02507 nsp_acc=99.181 throughput=127.0K tks/s lr=0.0000211 time=128.59 INFO:root:[step 789249] mlm_loss=1.40516 mlm_acc=68.31415 nsp_loss=0.02706 nsp_acc=99.077 throughput=129.0K tks/s lr=0.0000211 time=111.54 INFO:root:[step 789499] mlm_loss=1.48414 mlm_acc=66.64520 nsp_loss=0.03656 nsp_acc=98.662 throughput=126.0K tks/s lr=0.0000211 time=124.69 INFO:root:[step 789749] mlm_loss=1.57058 mlm_acc=65.95445 nsp_loss=0.02743 nsp_acc=98.996 throughput=133.0K tks/s lr=0.0000210 time=136.39 INFO:root:[step 789999] mlm_loss=1.32278 mlm_acc=69.25950 nsp_loss=0.02859 nsp_acc=99.030 throughput=122.0K tks/s lr=0.0000210 time=109.34 INFO:root:[step 789999] Saving checkpoints to /home/ubuntu/ckpt-master/0789999.params, /home/ubuntu/ckpt-master/0789999.states. INFO:root:[step 790249] mlm_loss=1.34494 mlm_acc=68.96648 nsp_loss=0.03095 nsp_acc=98.918 throughput=105.0K tks/s lr=0.0000210 time=124.74 INFO:root:[step 790499] mlm_loss=1.39250 mlm_acc=67.61986 nsp_loss=0.04104 nsp_acc=98.462 throughput=121.0K tks/s lr=0.0000210 time=120.52 INFO:root:[step 790749] mlm_loss=1.42809 mlm_acc=66.49648 nsp_loss=0.04713 nsp_acc=98.314 throughput=132.0K tks/s lr=0.0000209 time=124.59 INFO:root:[step 790999] mlm_loss=1.75897 mlm_acc=63.16972 nsp_loss=0.03948 nsp_acc=98.504 throughput=147.0K tks/s lr=0.0000209 time=161.35 INFO:root:[step 791249] mlm_loss=1.44359 mlm_acc=68.17453 nsp_loss=0.02523 nsp_acc=99.115 throughput=130.0K tks/s lr=0.0000209 time=118.12 INFO:root:[step 791499] mlm_loss=1.37390 mlm_acc=68.81929 nsp_loss=0.02811 nsp_acc=99.034 throughput=111.0K tks/s lr=0.0000209 time=116.01 INFO:root:[step 791749] mlm_loss=1.49939 mlm_acc=67.54765 nsp_loss=0.02524 nsp_acc=99.134 throughput=132.0K tks/s lr=0.0000208 time=119.20 INFO:root:[step 791999] mlm_loss=1.63385 mlm_acc=64.70835 nsp_loss=0.04334 nsp_acc=98.338 throughput=136.0K tks/s lr=0.0000208 time=132.53 INFO:root:[step 792249] mlm_loss=1.36534 mlm_acc=69.07680 nsp_loss=0.03122 nsp_acc=98.903 throughput=115.0K tks/s lr=0.0000208 time=106.46 INFO:root:[step 792499] mlm_loss=1.73076 mlm_acc=63.70928 nsp_loss=0.05580 nsp_acc=97.782 throughput=133.0K tks/s lr=0.0000208 time=133.27 INFO:root:[step 792749] mlm_loss=1.56718 mlm_acc=67.05305 nsp_loss=0.01919 nsp_acc=99.325 throughput=140.0K tks/s lr=0.0000207 time=135.25 INFO:root:[step 792999] mlm_loss=1.56049 mlm_acc=66.56433 nsp_loss=0.02033 nsp_acc=99.303 throughput=136.0K tks/s lr=0.0000207 time=136.46 INFO:root:[step 793249] mlm_loss=1.25572 mlm_acc=69.32741 nsp_loss=0.03993 nsp_acc=98.629 throughput=115.0K tks/s lr=0.0000207 time=108.54 INFO:root:[step 793499] mlm_loss=1.40098 mlm_acc=66.97587 nsp_loss=0.04005 nsp_acc=98.568 throughput=139.0K tks/s lr=0.0000207 time=137.72 INFO:root:[step 793749] mlm_loss=1.55525 mlm_acc=65.89056 nsp_loss=0.03911 nsp_acc=98.597 throughput=135.0K tks/s lr=0.0000206 time=137.43 INFO:root:[step 793999] mlm_loss=1.35533 mlm_acc=68.27482 nsp_loss=0.03066 nsp_acc=98.956 throughput=130.0K tks/s lr=0.0000206 time=111.91 INFO:root:[step 794249] mlm_loss=1.51520 mlm_acc=67.17462 nsp_loss=0.01992 nsp_acc=99.317 throughput=131.0K tks/s lr=0.0000206 time=132.33 INFO:root:[step 794499] mlm_loss=1.47051 mlm_acc=66.94330 nsp_loss=0.02342 nsp_acc=99.172 throughput=128.0K tks/s lr=0.0000206 time=129.64 INFO:root:[step 794749] mlm_loss=1.33963 mlm_acc=68.76893 nsp_loss=0.03292 nsp_acc=98.812 throughput=119.0K tks/s lr=0.0000205 time=109.00 INFO:root:[step 794999] mlm_loss=1.50659 mlm_acc=67.16240 nsp_loss=0.01882 nsp_acc=99.336 throughput=138.0K tks/s lr=0.0000205 time=130.31 INFO:root:[step 794999] Saving checkpoints to /home/ubuntu/ckpt-master/0794999.params, /home/ubuntu/ckpt-master/0794999.states. INFO:root:[step 795249] mlm_loss=1.51273 mlm_acc=67.17203 nsp_loss=0.02426 nsp_acc=99.144 throughput=119.0K tks/s lr=0.0000205 time=136.81 INFO:root:[step 795499] mlm_loss=1.51132 mlm_acc=65.83290 nsp_loss=0.03469 nsp_acc=98.721 throughput=142.0K tks/s lr=0.0000205 time=142.18 INFO:root:[step 795749] mlm_loss=1.44567 mlm_acc=67.52425 nsp_loss=0.03348 nsp_acc=98.788 throughput=123.0K tks/s lr=0.0000204 time=127.24 INFO:root:[step 795999] mlm_loss=1.31783 mlm_acc=68.66481 nsp_loss=0.04116 nsp_acc=98.471 throughput=117.0K tks/s lr=0.0000204 time=107.54 INFO:root:[step 796249] mlm_loss=1.36171 mlm_acc=69.08155 nsp_loss=0.02924 nsp_acc=98.981 throughput=123.0K tks/s lr=0.0000204 time=107.87 INFO:root:[step 796499] mlm_loss=1.34327 mlm_acc=68.95691 nsp_loss=0.02874 nsp_acc=99.025 throughput=112.0K tks/s lr=0.0000204 time=116.60 INFO:root:[step 796749] mlm_loss=1.59441 mlm_acc=64.96233 nsp_loss=0.04725 nsp_acc=98.213 throughput=132.0K tks/s lr=0.0000203 time=114.77 INFO:root:[step 796999] mlm_loss=1.71592 mlm_acc=63.62323 nsp_loss=0.02562 nsp_acc=99.097 throughput=148.0K tks/s lr=0.0000203 time=144.85 INFO:root:[step 797249] mlm_loss=1.37077 mlm_acc=68.24937 nsp_loss=0.02696 nsp_acc=99.085 throughput=116.0K tks/s lr=0.0000203 time=122.84 INFO:root:[step 797499] mlm_loss=1.48401 mlm_acc=66.05662 nsp_loss=0.05750 nsp_acc=97.749 throughput=138.0K tks/s lr=0.0000203 time=122.38 INFO:root:[step 797749] mlm_loss=1.56899 mlm_acc=65.80782 nsp_loss=0.03557 nsp_acc=98.676 throughput=144.0K tks/s lr=0.0000202 time=143.65 INFO:root:[step 797999] mlm_loss=1.59448 mlm_acc=66.60486 nsp_loss=0.01964 nsp_acc=99.287 throughput=143.0K tks/s lr=0.0000202 time=137.67 INFO:root:[step 798249] mlm_loss=1.64996 mlm_acc=65.42564 nsp_loss=0.03027 nsp_acc=98.860 throughput=146.0K tks/s lr=0.0000202 time=155.40 INFO:root:[step 798499] mlm_loss=1.55207 mlm_acc=67.38446 nsp_loss=0.01825 nsp_acc=99.399 throughput=142.0K tks/s lr=0.0000202 time=140.10 INFO:root:[step 798749] mlm_loss=1.60931 mlm_acc=65.21120 nsp_loss=0.02403 nsp_acc=99.101 throughput=147.0K tks/s lr=0.0000201 time=150.14 INFO:root:[step 798999] mlm_loss=1.48763 mlm_acc=67.70961 nsp_loss=0.02144 nsp_acc=99.245 throughput=137.0K tks/s lr=0.0000201 time=117.65 INFO:root:[step 799249] mlm_loss=1.13522 mlm_acc=70.89374 nsp_loss=0.04144 nsp_acc=98.506 throughput=103.0K tks/s lr=0.0000201 time=100.93 INFO:root:[step 799499] mlm_loss=1.51327 mlm_acc=65.79611 nsp_loss=0.03743 nsp_acc=98.634 throughput=139.0K tks/s lr=0.0000201 time=139.02 INFO:root:[step 799749] mlm_loss=1.60157 mlm_acc=66.07337 nsp_loss=0.01691 nsp_acc=99.419 throughput=147.0K tks/s lr=0.0000200 time=139.75 INFO:root:[step 799999] mlm_loss=1.45308 mlm_acc=67.61479 nsp_loss=0.02433 nsp_acc=99.166 throughput=128.0K tks/s lr=0.0000200 time=127.53 INFO:root:[step 799999] Saving checkpoints to /home/ubuntu/ckpt-master/0799999.params, /home/ubuntu/ckpt-master/0799999.states. INFO:root:[step 800249] mlm_loss=1.55143 mlm_acc=65.01955 nsp_loss=0.02317 nsp_acc=99.157 throughput=126.0K tks/s lr=0.0000200 time=155.28 INFO:root:[step 800499] mlm_loss=1.38620 mlm_acc=68.60199 nsp_loss=0.02807 nsp_acc=99.019 throughput=126.0K tks/s lr=0.0000200 time=109.61 INFO:root:[step 800749] mlm_loss=1.52304 mlm_acc=67.27062 nsp_loss=0.02385 nsp_acc=99.156 throughput=131.0K tks/s lr=0.0000199 time=127.58 INFO:root:[step 800999] mlm_loss=1.42929 mlm_acc=67.84618 nsp_loss=0.03519 nsp_acc=98.696 throughput=126.0K tks/s lr=0.0000199 time=122.87 INFO:root:[step 801249] mlm_loss=1.54347 mlm_acc=66.33127 nsp_loss=0.06013 nsp_acc=97.629 throughput=151.0K tks/s lr=0.0000199 time=154.34 INFO:root:[step 801499] mlm_loss=1.70300 mlm_acc=64.00753 nsp_loss=0.03116 nsp_acc=98.854 throughput=158.0K tks/s lr=0.0000199 time=160.56 INFO:root:[step 801749] mlm_loss=1.45916 mlm_acc=67.90623 nsp_loss=0.02754 nsp_acc=98.990 throughput=125.0K tks/s lr=0.0000198 time=127.42 INFO:root:[step 801999] mlm_loss=1.55216 mlm_acc=66.44173 nsp_loss=0.02105 nsp_acc=99.237 throughput=141.0K tks/s lr=0.0000198 time=133.15 INFO:root:[step 802249] mlm_loss=1.45250 mlm_acc=67.56579 nsp_loss=0.02447 nsp_acc=99.151 throughput=134.0K tks/s lr=0.0000198 time=118.70 INFO:root:[step 802499] mlm_loss=1.39940 mlm_acc=68.48720 nsp_loss=0.02907 nsp_acc=99.014 throughput=119.0K tks/s lr=0.0000198 time=118.85 INFO:root:[step 802749] mlm_loss=1.47367 mlm_acc=66.73941 nsp_loss=0.07146 nsp_acc=97.030 throughput=137.0K tks/s lr=0.0000197 time=133.16 INFO:root:[step 802999] mlm_loss=1.57183 mlm_acc=66.80960 nsp_loss=0.01959 nsp_acc=99.331 throughput=144.0K tks/s lr=0.0000197 time=129.47 INFO:root:[step 803249] mlm_loss=1.42140 mlm_acc=66.64681 nsp_loss=0.02733 nsp_acc=99.054 throughput=134.0K tks/s lr=0.0000197 time=131.20 INFO:root:[step 803499] mlm_loss=1.41065 mlm_acc=67.97387 nsp_loss=0.02737 nsp_acc=99.021 throughput=122.0K tks/s lr=0.0000197 time=126.55 INFO:root:[step 803749] mlm_loss=1.36461 mlm_acc=68.99606 nsp_loss=0.03140 nsp_acc=98.915 throughput=120.0K tks/s lr=0.0000196 time=110.54 INFO:root:[step 803999] mlm_loss=1.40396 mlm_acc=68.32329 nsp_loss=0.02955 nsp_acc=98.957 throughput=120.0K tks/s lr=0.0000196 time=119.87 INFO:root:[step 804249] mlm_loss=1.43470 mlm_acc=68.17040 nsp_loss=0.02737 nsp_acc=99.047 throughput=128.0K tks/s lr=0.0000196 time=113.16 INFO:root:[step 804499] mlm_loss=1.52540 mlm_acc=67.19807 nsp_loss=0.03202 nsp_acc=98.823 throughput=135.0K tks/s lr=0.0000196 time=131.23 INFO:root:[step 804749] mlm_loss=1.52115 mlm_acc=66.73818 nsp_loss=0.04073 nsp_acc=98.393 throughput=143.0K tks/s lr=0.0000195 time=129.12 INFO:root:[step 804999] mlm_loss=1.53741 mlm_acc=67.47315 nsp_loss=0.02112 nsp_acc=99.265 throughput=134.0K tks/s lr=0.0000195 time=129.39 INFO:root:[step 804999] Saving checkpoints to /home/ubuntu/ckpt-master/0804999.params, /home/ubuntu/ckpt-master/0804999.states. INFO:root:[step 805249] mlm_loss=1.48874 mlm_acc=66.24146 nsp_loss=0.05175 nsp_acc=98.000 throughput=123.0K tks/s lr=0.0000195 time=153.60 INFO:root:[step 805499] mlm_loss=1.35520 mlm_acc=68.71563 nsp_loss=0.02901 nsp_acc=99.005 throughput=124.0K tks/s lr=0.0000195 time=109.44 INFO:root:[step 805749] mlm_loss=1.71970 mlm_acc=63.37526 nsp_loss=0.07151 nsp_acc=97.061 throughput=143.0K tks/s lr=0.0000194 time=159.71 INFO:root:[step 805999] mlm_loss=1.41163 mlm_acc=68.24030 nsp_loss=0.02757 nsp_acc=99.026 throughput=128.0K tks/s lr=0.0000194 time=113.14 INFO:root:[step 806249] mlm_loss=1.57712 mlm_acc=64.76288 nsp_loss=0.04846 nsp_acc=98.130 throughput=134.0K tks/s lr=0.0000194 time=132.57 INFO:root:[step 806499] mlm_loss=1.29395 mlm_acc=69.44850 nsp_loss=0.03442 nsp_acc=98.799 throughput=121.0K tks/s lr=0.0000194 time=108.17 INFO:root:[step 806749] mlm_loss=1.46560 mlm_acc=67.47434 nsp_loss=0.02313 nsp_acc=99.178 throughput=129.0K tks/s lr=0.0000193 time=127.73 INFO:root:[step 806999] mlm_loss=1.33320 mlm_acc=69.08910 nsp_loss=0.03163 nsp_acc=98.898 throughput=123.0K tks/s lr=0.0000193 time=108.66 INFO:root:[step 807249] mlm_loss=1.45637 mlm_acc=67.80601 nsp_loss=0.02681 nsp_acc=99.051 throughput=123.0K tks/s lr=0.0000193 time=122.74 INFO:root:[step 807499] mlm_loss=1.57535 mlm_acc=66.01207 nsp_loss=0.03455 nsp_acc=98.659 throughput=150.0K tks/s lr=0.0000193 time=147.12 INFO:root:[step 807749] mlm_loss=1.58676 mlm_acc=65.96719 nsp_loss=0.04041 nsp_acc=98.460 throughput=151.0K tks/s lr=0.0000192 time=153.44 INFO:root:[step 807999] mlm_loss=1.46028 mlm_acc=68.12415 nsp_loss=0.02581 nsp_acc=99.112 throughput=132.0K tks/s lr=0.0000192 time=113.68 INFO:root:[step 808249] mlm_loss=1.64475 mlm_acc=65.28696 nsp_loss=0.04778 nsp_acc=98.094 throughput=144.0K tks/s lr=0.0000192 time=159.43 INFO:root:[step 808499] mlm_loss=1.55079 mlm_acc=67.33499 nsp_loss=0.02280 nsp_acc=99.206 throughput=141.0K tks/s lr=0.0000192 time=122.80 INFO:root:[step 808749] mlm_loss=1.46088 mlm_acc=65.93338 nsp_loss=0.03049 nsp_acc=98.899 throughput=128.0K tks/s lr=0.0000191 time=126.64 INFO:root:[step 808999] mlm_loss=1.45164 mlm_acc=66.16582 nsp_loss=0.03681 nsp_acc=98.636 throughput=123.0K tks/s lr=0.0000191 time=127.42 INFO:root:[step 809249] mlm_loss=1.57630 mlm_acc=64.98523 nsp_loss=0.02810 nsp_acc=99.035 throughput=142.0K tks/s lr=0.0000191 time=142.14 INFO:root:[step 809499] mlm_loss=1.55053 mlm_acc=65.35489 nsp_loss=0.03848 nsp_acc=98.556 throughput=145.0K tks/s lr=0.0000191 time=124.50 INFO:root:[step 809749] mlm_loss=1.57859 mlm_acc=65.82760 nsp_loss=0.04206 nsp_acc=98.339 throughput=142.0K tks/s lr=0.0000190 time=158.50 INFO:root:[step 809999] mlm_loss=1.43436 mlm_acc=67.47973 nsp_loss=0.02504 nsp_acc=99.091 throughput=137.0K tks/s lr=0.0000190 time=116.90 INFO:root:[step 809999] Saving checkpoints to /home/ubuntu/ckpt-master/0809999.params, /home/ubuntu/ckpt-master/0809999.states. INFO:root:[step 810249] mlm_loss=1.85506 mlm_acc=62.90761 nsp_loss=0.04904 nsp_acc=98.080 throughput=120.0K tks/s lr=0.0000190 time=149.59 INFO:root:[step 810499] mlm_loss=1.52929 mlm_acc=67.33411 nsp_loss=0.02302 nsp_acc=99.202 throughput=128.0K tks/s lr=0.0000190 time=129.51 INFO:root:[step 810749] mlm_loss=1.52020 mlm_acc=67.16420 nsp_loss=0.02285 nsp_acc=99.178 throughput=139.0K tks/s lr=0.0000189 time=121.81 INFO:root:[step 810999] mlm_loss=1.50953 mlm_acc=65.77567 nsp_loss=0.04200 nsp_acc=98.493 throughput=128.0K tks/s lr=0.0000189 time=126.45 INFO:root:[step 811249] mlm_loss=1.70447 mlm_acc=64.43423 nsp_loss=0.05314 nsp_acc=97.824 throughput=149.0K tks/s lr=0.0000189 time=152.62 INFO:root:[step 811499] mlm_loss=1.39189 mlm_acc=68.64476 nsp_loss=0.02634 nsp_acc=99.052 throughput=117.0K tks/s lr=0.0000189 time=120.89 INFO:root:[step 811749] mlm_loss=1.46656 mlm_acc=67.81680 nsp_loss=0.02615 nsp_acc=99.079 throughput=133.0K tks/s lr=0.0000188 time=113.92 INFO:root:[step 811999] mlm_loss=1.46729 mlm_acc=67.99578 nsp_loss=0.02630 nsp_acc=99.067 throughput=122.0K tks/s lr=0.0000188 time=123.65 INFO:root:[step 812249] mlm_loss=1.45229 mlm_acc=67.88915 nsp_loss=0.02860 nsp_acc=98.977 throughput=133.0K tks/s lr=0.0000188 time=114.14 INFO:root:[step 812499] mlm_loss=1.47228 mlm_acc=66.62246 nsp_loss=0.03964 nsp_acc=98.517 throughput=138.0K tks/s lr=0.0000188 time=139.33 INFO:root:[step 812749] mlm_loss=1.57805 mlm_acc=64.97144 nsp_loss=0.02822 nsp_acc=98.991 throughput=151.0K tks/s lr=0.0000187 time=144.85 INFO:root:[step 812999] mlm_loss=1.57389 mlm_acc=66.02692 nsp_loss=0.02176 nsp_acc=99.209 throughput=136.0K tks/s lr=0.0000187 time=138.20 INFO:root:[step 813249] mlm_loss=1.48661 mlm_acc=68.33463 nsp_loss=0.02073 nsp_acc=99.344 throughput=137.0K tks/s lr=0.0000187 time=136.00 INFO:root:[step 813499] mlm_loss=1.45001 mlm_acc=68.24442 nsp_loss=0.02426 nsp_acc=99.169 throughput=124.0K tks/s lr=0.0000187 time=122.98 INFO:root:[step 813749] mlm_loss=1.50192 mlm_acc=67.80998 nsp_loss=0.02374 nsp_acc=99.173 throughput=134.0K tks/s lr=0.0000186 time=119.67 INFO:root:[step 813999] mlm_loss=1.61260 mlm_acc=64.83298 nsp_loss=0.05760 nsp_acc=97.783 throughput=150.0K tks/s lr=0.0000186 time=167.47 INFO:root:[step 814249] mlm_loss=1.53105 mlm_acc=66.19728 nsp_loss=0.04962 nsp_acc=98.008 throughput=144.0K tks/s lr=0.0000186 time=125.82 INFO:root:[step 814499] mlm_loss=1.37254 mlm_acc=68.14362 nsp_loss=0.03476 nsp_acc=98.754 throughput=121.0K tks/s lr=0.0000186 time=123.36 INFO:root:[step 814749] mlm_loss=1.56830 mlm_acc=67.03519 nsp_loss=0.01879 nsp_acc=99.363 throughput=136.0K tks/s lr=0.0000185 time=134.13 INFO:root:[step 814999] mlm_loss=1.58292 mlm_acc=66.83910 nsp_loss=0.01974 nsp_acc=99.294 throughput=145.0K tks/s lr=0.0000185 time=128.83 INFO:root:[step 814999] Saving checkpoints to /home/ubuntu/ckpt-master/0814999.params, /home/ubuntu/ckpt-master/0814999.states. INFO:root:[step 815249] mlm_loss=1.42463 mlm_acc=67.73542 nsp_loss=0.03765 nsp_acc=98.598 throughput=114.0K tks/s lr=0.0000185 time=144.26 INFO:root:[step 815499] mlm_loss=1.57604 mlm_acc=66.62639 nsp_loss=0.03301 nsp_acc=98.794 throughput=143.0K tks/s lr=0.0000185 time=145.56 INFO:root:[step 815749] mlm_loss=1.49759 mlm_acc=67.27292 nsp_loss=0.02354 nsp_acc=99.191 throughput=130.0K tks/s lr=0.0000184 time=129.44 INFO:root:[step 815999] mlm_loss=1.62068 mlm_acc=65.02196 nsp_loss=0.02424 nsp_acc=99.110 throughput=147.0K tks/s lr=0.0000184 time=151.36 INFO:root:[step 816249] mlm_loss=1.44861 mlm_acc=68.00069 nsp_loss=0.02716 nsp_acc=99.066 throughput=130.0K tks/s lr=0.0000184 time=115.13 INFO:root:[step 816499] mlm_loss=1.64456 mlm_acc=65.27324 nsp_loss=0.04851 nsp_acc=98.077 throughput=137.0K tks/s lr=0.0000184 time=154.30 INFO:root:[step 816749] mlm_loss=1.50659 mlm_acc=67.61439 nsp_loss=0.02067 nsp_acc=99.237 throughput=140.0K tks/s lr=0.0000183 time=122.38 INFO:root:[step 816999] mlm_loss=1.36361 mlm_acc=68.90084 nsp_loss=0.03121 nsp_acc=98.875 throughput=114.0K tks/s lr=0.0000183 time=120.63 INFO:root:[step 817249] mlm_loss=1.36460 mlm_acc=68.11615 nsp_loss=0.04884 nsp_acc=98.117 throughput=136.0K tks/s lr=0.0000183 time=117.36 INFO:root:[step 817499] mlm_loss=1.45632 mlm_acc=68.96377 nsp_loss=0.03652 nsp_acc=98.663 throughput=142.0K tks/s lr=0.0000183 time=139.65 INFO:root:[step 817749] mlm_loss=1.36672 mlm_acc=69.75554 nsp_loss=0.03111 nsp_acc=98.926 throughput=121.0K tks/s lr=0.0000182 time=127.70 INFO:root:[step 817999] mlm_loss=1.27863 mlm_acc=69.55682 nsp_loss=0.03393 nsp_acc=98.841 throughput=114.0K tks/s lr=0.0000182 time=105.35 INFO:root:[step 818249] mlm_loss=1.47293 mlm_acc=65.83750 nsp_loss=0.04743 nsp_acc=98.241 throughput=142.0K tks/s lr=0.0000182 time=137.37 INFO:root:[step 818499] mlm_loss=1.42051 mlm_acc=67.79311 nsp_loss=0.02534 nsp_acc=99.132 throughput=136.0K tks/s lr=0.0000182 time=121.22 INFO:root:[step 818749] mlm_loss=1.52857 mlm_acc=67.31551 nsp_loss=0.02335 nsp_acc=99.133 throughput=134.0K tks/s lr=0.0000181 time=131.20 INFO:root:[step 818999] mlm_loss=1.70829 mlm_acc=64.55523 nsp_loss=0.04334 nsp_acc=98.266 throughput=142.0K tks/s lr=0.0000181 time=137.34 INFO:root:[step 819249] mlm_loss=1.61067 mlm_acc=66.50910 nsp_loss=0.01640 nsp_acc=99.432 throughput=148.0K tks/s lr=0.0000181 time=143.58 INFO:root:[step 819499] mlm_loss=1.57464 mlm_acc=66.75192 nsp_loss=0.01662 nsp_acc=99.429 throughput=143.0K tks/s lr=0.0000181 time=138.43 INFO:root:[step 819749] mlm_loss=1.30411 mlm_acc=69.37115 nsp_loss=0.03249 nsp_acc=98.872 throughput=113.0K tks/s lr=0.0000180 time=117.09 INFO:root:[step 819999] mlm_loss=1.44058 mlm_acc=68.13356 nsp_loss=0.02593 nsp_acc=99.082 throughput=132.0K tks/s lr=0.0000180 time=120.13 INFO:root:[step 819999] Saving checkpoints to /home/ubuntu/ckpt-master/0819999.params, /home/ubuntu/ckpt-master/0819999.states. INFO:root:[step 820249] mlm_loss=1.47868 mlm_acc=67.79971 nsp_loss=0.02285 nsp_acc=99.198 throughput=116.0K tks/s lr=0.0000180 time=138.66 INFO:root:[step 820499] mlm_loss=1.55488 mlm_acc=66.77072 nsp_loss=0.02005 nsp_acc=99.271 throughput=139.0K tks/s lr=0.0000180 time=140.24 INFO:root:[step 820749] mlm_loss=1.51055 mlm_acc=66.43989 nsp_loss=0.05901 nsp_acc=97.715 throughput=144.0K tks/s lr=0.0000179 time=142.77 INFO:root:[step 820999] mlm_loss=1.45402 mlm_acc=66.66829 nsp_loss=0.05603 nsp_acc=97.796 throughput=134.0K tks/s lr=0.0000179 time=122.21 INFO:root:[step 821249] mlm_loss=1.52809 mlm_acc=66.29872 nsp_loss=0.02805 nsp_acc=98.991 throughput=141.0K tks/s lr=0.0000179 time=138.78 INFO:root:[step 821499] mlm_loss=1.70977 mlm_acc=63.88911 nsp_loss=0.02602 nsp_acc=99.025 throughput=152.0K tks/s lr=0.0000179 time=166.37 INFO:root:[step 821749] mlm_loss=1.59521 mlm_acc=65.61386 nsp_loss=0.02941 nsp_acc=98.915 throughput=148.0K tks/s lr=0.0000178 time=150.19 INFO:root:[step 821999] mlm_loss=1.51974 mlm_acc=67.33267 nsp_loss=0.02516 nsp_acc=99.116 throughput=135.0K tks/s lr=0.0000178 time=125.55 INFO:root:[step 822249] mlm_loss=1.59562 mlm_acc=65.82473 nsp_loss=0.03364 nsp_acc=98.746 throughput=144.0K tks/s lr=0.0000178 time=142.63 INFO:root:[step 822499] mlm_loss=1.49350 mlm_acc=65.95321 nsp_loss=0.03316 nsp_acc=98.799 throughput=139.0K tks/s lr=0.0000178 time=128.40 INFO:root:[step 822749] mlm_loss=1.13808 mlm_acc=71.02379 nsp_loss=0.04476 nsp_acc=98.457 throughput=100.0K tks/s lr=0.0000177 time=99.67 INFO:root:[step 822999] mlm_loss=1.29088 mlm_acc=68.15869 nsp_loss=0.04584 nsp_acc=98.394 throughput=113.0K tks/s lr=0.0000177 time=116.12 INFO:root:[step 823249] mlm_loss=1.63406 mlm_acc=65.19304 nsp_loss=0.02881 nsp_acc=98.918 throughput=142.0K tks/s lr=0.0000177 time=138.48 INFO:root:[step 823499] mlm_loss=1.46058 mlm_acc=67.61990 nsp_loss=0.02470 nsp_acc=99.113 throughput=134.0K tks/s lr=0.0000177 time=122.50 INFO:root:[step 823749] mlm_loss=1.67402 mlm_acc=64.20890 nsp_loss=0.04822 nsp_acc=98.070 throughput=157.0K tks/s lr=0.0000176 time=172.94 INFO:root:[step 823999] mlm_loss=1.57567 mlm_acc=66.82852 nsp_loss=0.03634 nsp_acc=98.590 throughput=156.0K tks/s lr=0.0000176 time=154.41 INFO:root:[step 824249] mlm_loss=1.39414 mlm_acc=68.24592 nsp_loss=0.02835 nsp_acc=98.996 throughput=118.0K tks/s lr=0.0000176 time=123.70 INFO:root:[step 824499] mlm_loss=1.37220 mlm_acc=68.84409 nsp_loss=0.03200 nsp_acc=98.866 throughput=122.0K tks/s lr=0.0000176 time=109.95 INFO:root:[step 824749] mlm_loss=1.53384 mlm_acc=66.06771 nsp_loss=0.05949 nsp_acc=97.702 throughput=142.0K tks/s lr=0.0000175 time=135.99 INFO:root:[step 824999] mlm_loss=1.53832 mlm_acc=66.92078 nsp_loss=0.02537 nsp_acc=99.068 throughput=130.0K tks/s lr=0.0000175 time=132.59 INFO:root:[step 824999] Saving checkpoints to /home/ubuntu/ckpt-master/0824999.params, /home/ubuntu/ckpt-master/0824999.states. INFO:root:[step 825249] mlm_loss=1.32960 mlm_acc=68.84027 nsp_loss=0.04103 nsp_acc=98.472 throughput=100.0K tks/s lr=0.0000175 time=119.09 INFO:root:[step 825499] mlm_loss=1.44057 mlm_acc=68.29131 nsp_loss=0.02623 nsp_acc=99.065 throughput=134.0K tks/s lr=0.0000175 time=114.55 INFO:root:[step 825749] mlm_loss=1.42157 mlm_acc=68.26855 nsp_loss=0.02642 nsp_acc=99.065 throughput=119.0K tks/s lr=0.0000174 time=121.36 INFO:root:[step 825999] mlm_loss=1.53425 mlm_acc=67.28089 nsp_loss=0.02552 nsp_acc=99.064 throughput=136.0K tks/s lr=0.0000174 time=130.31 INFO:root:[step 826249] mlm_loss=1.72621 mlm_acc=62.92042 nsp_loss=0.04156 nsp_acc=98.389 throughput=149.0K tks/s lr=0.0000174 time=155.10 INFO:root:[step 826499] mlm_loss=1.49573 mlm_acc=67.37386 nsp_loss=0.02396 nsp_acc=99.164 throughput=133.0K tks/s lr=0.0000174 time=128.32 INFO:root:[step 826749] mlm_loss=1.44190 mlm_acc=68.10582 nsp_loss=0.02509 nsp_acc=99.121 throughput=129.0K tks/s lr=0.0000173 time=115.92 INFO:root:[step 826999] mlm_loss=1.28582 mlm_acc=68.97686 nsp_loss=0.04656 nsp_acc=98.241 throughput=107.0K tks/s lr=0.0000173 time=112.59 INFO:root:[step 827249] mlm_loss=1.50693 mlm_acc=67.44126 nsp_loss=0.02431 nsp_acc=99.175 throughput=138.0K tks/s lr=0.0000173 time=121.73 INFO:root:[step 827499] mlm_loss=1.50212 mlm_acc=66.52579 nsp_loss=0.04580 nsp_acc=98.252 throughput=141.0K tks/s lr=0.0000173 time=141.57 INFO:root:[step 827749] mlm_loss=1.55699 mlm_acc=65.44909 nsp_loss=0.05944 nsp_acc=97.626 throughput=151.0K tks/s lr=0.0000172 time=152.22 INFO:root:[step 827999] mlm_loss=1.49709 mlm_acc=66.79846 nsp_loss=0.03487 nsp_acc=98.689 throughput=133.0K tks/s lr=0.0000172 time=138.62 INFO:root:[step 828249] mlm_loss=1.56209 mlm_acc=65.58327 nsp_loss=0.03332 nsp_acc=98.728 throughput=145.0K tks/s lr=0.0000172 time=144.34 INFO:root:[step 828499] mlm_loss=1.42061 mlm_acc=67.73360 nsp_loss=0.03149 nsp_acc=98.876 throughput=119.0K tks/s lr=0.0000172 time=125.36 INFO:root:[step 828749] mlm_loss=1.41427 mlm_acc=68.11284 nsp_loss=0.02760 nsp_acc=99.031 throughput=131.0K tks/s lr=0.0000171 time=114.79 INFO:root:[step 828999] mlm_loss=1.46971 mlm_acc=66.14486 nsp_loss=0.03539 nsp_acc=98.708 throughput=141.0K tks/s lr=0.0000171 time=144.33 INFO:root:[step 829249] mlm_loss=1.49071 mlm_acc=67.49082 nsp_loss=0.02472 nsp_acc=99.095 throughput=129.0K tks/s lr=0.0000171 time=126.90 INFO:root:[step 829499] mlm_loss=1.42914 mlm_acc=68.32471 nsp_loss=0.02836 nsp_acc=99.038 throughput=128.0K tks/s lr=0.0000171 time=116.48 INFO:root:[step 829749] mlm_loss=1.36029 mlm_acc=68.89875 nsp_loss=0.02757 nsp_acc=99.023 throughput=112.0K tks/s lr=0.0000170 time=115.91 INFO:root:[step 829999] mlm_loss=1.42205 mlm_acc=68.33360 nsp_loss=0.02739 nsp_acc=99.047 throughput=129.0K tks/s lr=0.0000170 time=118.25 INFO:root:[step 829999] Saving checkpoints to /home/ubuntu/ckpt-master/0829999.params, /home/ubuntu/ckpt-master/0829999.states. INFO:root:[step 830249] mlm_loss=1.49025 mlm_acc=67.37124 nsp_loss=0.02330 nsp_acc=99.166 throughput=121.0K tks/s lr=0.0000170 time=144.67 INFO:root:[step 830499] mlm_loss=1.58339 mlm_acc=65.27578 nsp_loss=0.03355 nsp_acc=98.719 throughput=141.0K tks/s lr=0.0000170 time=140.97 INFO:root:[step 830749] mlm_loss=1.40099 mlm_acc=68.49325 nsp_loss=0.02939 nsp_acc=98.957 throughput=129.0K tks/s lr=0.0000169 time=110.79 INFO:root:[step 830999] mlm_loss=1.51018 mlm_acc=67.51547 nsp_loss=0.01975 nsp_acc=99.315 throughput=133.0K tks/s lr=0.0000169 time=129.58 INFO:root:[step 831249] mlm_loss=1.42140 mlm_acc=68.39224 nsp_loss=0.02782 nsp_acc=99.061 throughput=126.0K tks/s lr=0.0000169 time=112.40 INFO:root:[step 831499] mlm_loss=1.59141 mlm_acc=65.96357 nsp_loss=0.03316 nsp_acc=98.777 throughput=146.0K tks/s lr=0.0000169 time=156.50 INFO:root:[step 831749] mlm_loss=1.45735 mlm_acc=67.80840 nsp_loss=0.02565 nsp_acc=99.111 throughput=137.0K tks/s lr=0.0000168 time=123.43 INFO:root:[step 831999] mlm_loss=1.44223 mlm_acc=67.52813 nsp_loss=0.02737 nsp_acc=99.016 throughput=124.0K tks/s lr=0.0000168 time=128.47 INFO:root:[step 832249] mlm_loss=1.52743 mlm_acc=65.47076 nsp_loss=0.03367 nsp_acc=98.776 throughput=136.0K tks/s lr=0.0000168 time=135.67 INFO:root:[step 832499] mlm_loss=1.45901 mlm_acc=67.56759 nsp_loss=0.02737 nsp_acc=99.012 throughput=138.0K tks/s lr=0.0000168 time=117.10 INFO:root:[step 832749] mlm_loss=1.37581 mlm_acc=68.57799 nsp_loss=0.02904 nsp_acc=99.003 throughput=119.0K tks/s lr=0.0000167 time=120.29 INFO:root:[step 832999] mlm_loss=1.66654 mlm_acc=65.20993 nsp_loss=0.01781 nsp_acc=99.351 throughput=155.0K tks/s lr=0.0000167 time=155.35 INFO:root:[step 833249] mlm_loss=1.43372 mlm_acc=66.79899 nsp_loss=0.03504 nsp_acc=98.753 throughput=125.0K tks/s lr=0.0000167 time=125.01 INFO:root:[step 833499] mlm_loss=1.53491 mlm_acc=65.24861 nsp_loss=0.03750 nsp_acc=98.636 throughput=140.0K tks/s lr=0.0000167 time=125.87 INFO:root:[step 833749] mlm_loss=1.38196 mlm_acc=67.45801 nsp_loss=0.03832 nsp_acc=98.618 throughput=118.0K tks/s lr=0.0000166 time=122.16 INFO:root:[step 833999] mlm_loss=1.50664 mlm_acc=66.52927 nsp_loss=0.03826 nsp_acc=98.568 throughput=135.0K tks/s lr=0.0000166 time=135.06 INFO:root:[step 834249] mlm_loss=1.52601 mlm_acc=66.90137 nsp_loss=0.04563 nsp_acc=98.247 throughput=137.0K tks/s lr=0.0000166 time=140.39 INFO:root:[step 834499] mlm_loss=1.41881 mlm_acc=67.43413 nsp_loss=0.03331 nsp_acc=98.819 throughput=145.0K tks/s lr=0.0000166 time=122.64 INFO:root:[step 834749] mlm_loss=1.74168 mlm_acc=63.91404 nsp_loss=0.08930 nsp_acc=96.268 throughput=152.0K tks/s lr=0.0000165 time=152.94 INFO:root:[step 834999] mlm_loss=1.53164 mlm_acc=66.67755 nsp_loss=0.02581 nsp_acc=99.055 throughput=133.0K tks/s lr=0.0000165 time=130.64 INFO:root:[step 834999] Saving checkpoints to /home/ubuntu/ckpt-master/0834999.params, /home/ubuntu/ckpt-master/0834999.states. INFO:root:[step 835249] mlm_loss=1.51689 mlm_acc=66.39835 nsp_loss=0.06971 nsp_acc=97.174 throughput=117.0K tks/s lr=0.0000165 time=148.56 INFO:root:[step 835499] mlm_loss=1.43895 mlm_acc=66.94999 nsp_loss=0.03901 nsp_acc=98.529 throughput=137.0K tks/s lr=0.0000165 time=136.77 INFO:root:[step 835749] mlm_loss=1.39965 mlm_acc=68.08148 nsp_loss=0.03432 nsp_acc=98.735 throughput=129.0K tks/s lr=0.0000164 time=111.85 INFO:root:[step 835999] mlm_loss=1.65332 mlm_acc=64.63207 nsp_loss=0.04109 nsp_acc=98.438 throughput=143.0K tks/s lr=0.0000164 time=142.20 INFO:root:[step 836249] mlm_loss=1.66221 mlm_acc=64.23951 nsp_loss=0.02866 nsp_acc=98.939 throughput=143.0K tks/s lr=0.0000164 time=144.88 INFO:root:[step 836499] mlm_loss=1.55903 mlm_acc=66.82868 nsp_loss=0.02088 nsp_acc=99.247 throughput=138.0K tks/s lr=0.0000164 time=135.67 INFO:root:[step 836749] mlm_loss=1.55305 mlm_acc=66.98705 nsp_loss=0.02002 nsp_acc=99.278 throughput=139.0K tks/s lr=0.0000163 time=134.07 INFO:root:[step 836999] mlm_loss=1.53648 mlm_acc=66.79545 nsp_loss=0.02076 nsp_acc=99.266 throughput=139.0K tks/s lr=0.0000163 time=138.07 INFO:root:[step 837249] mlm_loss=1.44210 mlm_acc=68.06779 nsp_loss=0.02500 nsp_acc=99.103 throughput=133.0K tks/s lr=0.0000163 time=113.42 INFO:root:[step 837499] mlm_loss=1.37388 mlm_acc=68.59345 nsp_loss=0.03410 nsp_acc=98.730 throughput=107.0K tks/s lr=0.0000163 time=119.33 INFO:root:[step 837749] mlm_loss=1.38738 mlm_acc=68.48696 nsp_loss=0.02730 nsp_acc=99.052 throughput=127.0K tks/s lr=0.0000162 time=113.57 INFO:root:[step 837999] mlm_loss=1.43894 mlm_acc=68.13037 nsp_loss=0.02739 nsp_acc=99.018 throughput=118.0K tks/s lr=0.0000162 time=122.13 INFO:root:[step 838249] mlm_loss=1.55888 mlm_acc=65.29183 nsp_loss=0.02754 nsp_acc=99.005 throughput=146.0K tks/s lr=0.0000162 time=140.95 INFO:root:[step 838499] mlm_loss=1.66310 mlm_acc=64.45667 nsp_loss=0.05951 nsp_acc=97.660 throughput=162.0K tks/s lr=0.0000162 time=168.39 INFO:root:[step 838749] mlm_loss=1.43186 mlm_acc=67.03006 nsp_loss=0.03606 nsp_acc=98.679 throughput=119.0K tks/s lr=0.0000161 time=125.36 INFO:root:[step 838999] mlm_loss=1.44363 mlm_acc=67.78668 nsp_loss=0.02558 nsp_acc=99.117 throughput=134.0K tks/s lr=0.0000161 time=114.45 INFO:root:[step 839249] mlm_loss=1.53798 mlm_acc=67.13320 nsp_loss=0.02078 nsp_acc=99.311 throughput=136.0K tks/s lr=0.0000161 time=131.94 INFO:root:[step 839499] mlm_loss=1.42279 mlm_acc=68.29230 nsp_loss=0.02638 nsp_acc=99.076 throughput=130.0K tks/s lr=0.0000161 time=114.00 INFO:root:[step 839749] mlm_loss=1.55341 mlm_acc=66.16142 nsp_loss=0.03981 nsp_acc=98.492 throughput=141.0K tks/s lr=0.0000160 time=139.67 INFO:root:[step 839999] mlm_loss=1.49063 mlm_acc=66.32470 nsp_loss=0.03614 nsp_acc=98.669 throughput=138.0K tks/s lr=0.0000160 time=139.67 INFO:root:[step 839999] Saving checkpoints to /home/ubuntu/ckpt-master/0839999.params, /home/ubuntu/ckpt-master/0839999.states. INFO:root:[step 840249] mlm_loss=1.22574 mlm_acc=69.68654 nsp_loss=0.03879 nsp_acc=98.586 throughput=99.0K tks/s lr=0.0000160 time=121.43 INFO:root:[step 840499] mlm_loss=1.43749 mlm_acc=67.24128 nsp_loss=0.03306 nsp_acc=98.817 throughput=127.0K tks/s lr=0.0000160 time=125.11 INFO:root:[step 840749] mlm_loss=1.67135 mlm_acc=64.71802 nsp_loss=0.04203 nsp_acc=98.436 throughput=151.0K tks/s lr=0.0000159 time=155.22 INFO:root:[step 840999] mlm_loss=1.54709 mlm_acc=66.53463 nsp_loss=0.03072 nsp_acc=98.872 throughput=141.0K tks/s lr=0.0000159 time=139.71 INFO:root:[step 841249] mlm_loss=1.40894 mlm_acc=67.71289 nsp_loss=0.03500 nsp_acc=98.707 throughput=122.0K tks/s lr=0.0000159 time=128.07 INFO:root:[step 841499] mlm_loss=1.37491 mlm_acc=68.94189 nsp_loss=0.02978 nsp_acc=98.953 throughput=120.0K tks/s lr=0.0000159 time=109.08 INFO:root:[step 841749] mlm_loss=1.35211 mlm_acc=69.09545 nsp_loss=0.03165 nsp_acc=98.890 throughput=119.0K tks/s lr=0.0000158 time=107.40 INFO:root:[step 841999] mlm_loss=1.54028 mlm_acc=66.61679 nsp_loss=0.02168 nsp_acc=99.239 throughput=146.0K tks/s lr=0.0000158 time=158.93 INFO:root:[step 842249] mlm_loss=1.37194 mlm_acc=68.69862 nsp_loss=0.02759 nsp_acc=99.027 throughput=121.0K tks/s lr=0.0000158 time=111.39 INFO:root:[step 842499] mlm_loss=1.29358 mlm_acc=69.67325 nsp_loss=0.03001 nsp_acc=98.941 throughput=120.0K tks/s lr=0.0000158 time=106.84 INFO:root:[step 842749] mlm_loss=1.30381 mlm_acc=69.84192 nsp_loss=0.02635 nsp_acc=99.073 throughput=123.0K tks/s lr=0.0000157 time=108.74 INFO:root:[step 842999] mlm_loss=1.50571 mlm_acc=67.02121 nsp_loss=0.02078 nsp_acc=99.271 throughput=140.0K tks/s lr=0.0000157 time=133.66 INFO:root:[step 843249] mlm_loss=1.52990 mlm_acc=66.36973 nsp_loss=0.05763 nsp_acc=97.665 throughput=136.0K tks/s lr=0.0000157 time=133.76 INFO:root:[step 843499] mlm_loss=1.59625 mlm_acc=65.03447 nsp_loss=0.07081 nsp_acc=97.119 throughput=146.0K tks/s lr=0.0000157 time=143.96 INFO:root:[step 843749] mlm_loss=1.54862 mlm_acc=65.76333 nsp_loss=0.04243 nsp_acc=98.341 throughput=149.0K tks/s lr=0.0000156 time=148.71 INFO:root:[step 843999] mlm_loss=1.69143 mlm_acc=64.16081 nsp_loss=0.01493 nsp_acc=99.471 throughput=147.0K tks/s lr=0.0000156 time=162.70 INFO:root:[step 844249] mlm_loss=1.51527 mlm_acc=65.80020 nsp_loss=0.03532 nsp_acc=98.676 throughput=139.0K tks/s lr=0.0000156 time=140.40 INFO:root:[step 844499] mlm_loss=1.36879 mlm_acc=68.48701 nsp_loss=0.02600 nsp_acc=99.094 throughput=131.0K tks/s lr=0.0000156 time=115.70 INFO:root:[step 844749] mlm_loss=1.37723 mlm_acc=70.60715 nsp_loss=0.02204 nsp_acc=99.257 throughput=146.0K tks/s lr=0.0000155 time=142.45 INFO:root:[step 844999] mlm_loss=1.45735 mlm_acc=69.17334 nsp_loss=0.01818 nsp_acc=99.364 throughput=146.0K tks/s lr=0.0000155 time=143.53 INFO:root:[step 844999] Saving checkpoints to /home/ubuntu/ckpt-master/0844999.params, /home/ubuntu/ckpt-master/0844999.states. INFO:root:[step 845249] mlm_loss=1.56946 mlm_acc=66.26044 nsp_loss=0.03761 nsp_acc=98.489 throughput=136.0K tks/s lr=0.0000155 time=161.31 INFO:root:[step 845499] mlm_loss=1.44512 mlm_acc=68.22201 nsp_loss=0.02019 nsp_acc=99.300 throughput=129.0K tks/s lr=0.0000155 time=128.25 INFO:root:[step 845749] mlm_loss=1.42710 mlm_acc=68.19702 nsp_loss=0.02232 nsp_acc=99.227 throughput=127.0K tks/s lr=0.0000154 time=121.86 INFO:root:[step 845999] mlm_loss=1.41160 mlm_acc=67.80085 nsp_loss=0.02310 nsp_acc=99.197 throughput=136.0K tks/s lr=0.0000154 time=124.82 INFO:root:[step 846249] mlm_loss=1.37694 mlm_acc=68.58874 nsp_loss=0.02566 nsp_acc=99.114 throughput=121.0K tks/s lr=0.0000154 time=119.48 INFO:root:[step 846499] mlm_loss=1.52921 mlm_acc=67.24994 nsp_loss=0.01523 nsp_acc=99.479 throughput=140.0K tks/s lr=0.0000154 time=135.96 INFO:root:[step 846749] mlm_loss=1.49572 mlm_acc=67.72340 nsp_loss=0.01921 nsp_acc=99.329 throughput=138.0K tks/s lr=0.0000153 time=124.17 INFO:root:[step 846999] mlm_loss=1.31536 mlm_acc=69.42337 nsp_loss=0.02822 nsp_acc=99.004 throughput=113.0K tks/s lr=0.0000153 time=118.25 INFO:root:[step 847249] mlm_loss=1.44237 mlm_acc=67.86897 nsp_loss=0.02021 nsp_acc=99.308 throughput=139.0K tks/s lr=0.0000153 time=117.76 INFO:root:[step 847499] mlm_loss=1.64615 mlm_acc=64.42193 nsp_loss=0.02229 nsp_acc=99.208 throughput=144.0K tks/s lr=0.0000153 time=145.04 INFO:root:[step 847749] mlm_loss=1.25268 mlm_acc=69.93692 nsp_loss=0.03293 nsp_acc=98.839 throughput=105.0K tks/s lr=0.0000152 time=115.14 INFO:root:[step 847999] mlm_loss=1.29220 mlm_acc=71.18612 nsp_loss=0.02864 nsp_acc=99.030 throughput=139.0K tks/s lr=0.0000152 time=119.88 INFO:root:[step 848249] mlm_loss=1.35580 mlm_acc=69.01525 nsp_loss=0.03014 nsp_acc=98.921 throughput=125.0K tks/s lr=0.0000152 time=122.39 INFO:root:[step 848499] mlm_loss=1.52283 mlm_acc=66.62429 nsp_loss=0.02391 nsp_acc=99.134 throughput=141.0K tks/s lr=0.0000152 time=143.87 INFO:root:[step 848749] mlm_loss=1.34224 mlm_acc=69.08608 nsp_loss=0.02732 nsp_acc=99.034 throughput=121.0K tks/s lr=0.0000151 time=111.82 INFO:root:[step 848999] mlm_loss=1.52430 mlm_acc=66.31487 nsp_loss=0.02481 nsp_acc=99.127 throughput=137.0K tks/s lr=0.0000151 time=130.26 INFO:root:[step 849249] mlm_loss=1.46305 mlm_acc=66.43407 nsp_loss=0.03711 nsp_acc=98.609 throughput=127.0K tks/s lr=0.0000151 time=127.97 INFO:root:[step 849499] mlm_loss=1.26139 mlm_acc=73.05463 nsp_loss=0.02739 nsp_acc=99.087 throughput=147.0K tks/s lr=0.0000151 time=129.93 INFO:root:[step 849749] mlm_loss=1.27984 mlm_acc=70.97369 nsp_loss=0.02843 nsp_acc=99.023 throughput=111.0K tks/s lr=0.0000150 time=118.73 INFO:root:[step 849999] mlm_loss=1.37990 mlm_acc=68.67238 nsp_loss=0.02509 nsp_acc=99.141 throughput=126.0K tks/s lr=0.0000150 time=112.19 INFO:root:[step 849999] Saving checkpoints to /home/ubuntu/ckpt-master/0849999.params, /home/ubuntu/ckpt-master/0849999.states. INFO:root:[step 850249] mlm_loss=1.36394 mlm_acc=69.01540 nsp_loss=0.02560 nsp_acc=99.117 throughput=107.0K tks/s lr=0.0000150 time=123.72 INFO:root:[step 850499] mlm_loss=1.46800 mlm_acc=67.49070 nsp_loss=0.03713 nsp_acc=98.567 throughput=144.0K tks/s lr=0.0000150 time=143.28 INFO:root:[step 850749] mlm_loss=1.64783 mlm_acc=64.95492 nsp_loss=0.02334 nsp_acc=99.141 throughput=143.0K tks/s lr=0.0000149 time=139.24 INFO:root:[step 850999] mlm_loss=1.72887 mlm_acc=63.80892 nsp_loss=0.05091 nsp_acc=97.970 throughput=152.0K tks/s lr=0.0000149 time=168.50 INFO:root:[step 851249] mlm_loss=1.52972 mlm_acc=65.29403 nsp_loss=0.03365 nsp_acc=98.745 throughput=139.0K tks/s lr=0.0000149 time=124.33 INFO:root:[step 851499] mlm_loss=1.35544 mlm_acc=68.75568 nsp_loss=0.02526 nsp_acc=99.131 throughput=116.0K tks/s lr=0.0000149 time=118.37 INFO:root:[step 851749] mlm_loss=1.52231 mlm_acc=66.56443 nsp_loss=0.02768 nsp_acc=99.039 throughput=147.0K tks/s lr=0.0000148 time=147.56 INFO:root:[step 851999] mlm_loss=1.49753 mlm_acc=66.98959 nsp_loss=0.01881 nsp_acc=99.338 throughput=132.0K tks/s lr=0.0000148 time=132.25 INFO:root:[step 852249] mlm_loss=1.50065 mlm_acc=65.97795 nsp_loss=0.03197 nsp_acc=98.855 throughput=139.0K tks/s lr=0.0000148 time=122.01 INFO:root:[step 852499] mlm_loss=1.43392 mlm_acc=67.91326 nsp_loss=0.02610 nsp_acc=99.093 throughput=122.0K tks/s lr=0.0000148 time=128.26 INFO:root:[step 852749] mlm_loss=1.35736 mlm_acc=68.83063 nsp_loss=0.02767 nsp_acc=99.051 throughput=126.0K tks/s lr=0.0000147 time=108.50 INFO:root:[step 852999] mlm_loss=1.43780 mlm_acc=66.92016 nsp_loss=0.03292 nsp_acc=98.785 throughput=136.0K tks/s lr=0.0000147 time=138.60 INFO:root:[step 853249] mlm_loss=1.41805 mlm_acc=68.26887 nsp_loss=0.02161 nsp_acc=99.234 throughput=124.0K tks/s lr=0.0000147 time=122.01 INFO:root:[step 853499] mlm_loss=1.69255 mlm_acc=64.62041 nsp_loss=0.03493 nsp_acc=98.597 throughput=142.0K tks/s lr=0.0000147 time=143.03 INFO:root:[step 853749] mlm_loss=1.33701 mlm_acc=69.24138 nsp_loss=0.03095 nsp_acc=98.905 throughput=121.0K tks/s lr=0.0000146 time=106.99 INFO:root:[step 853999] mlm_loss=1.54792 mlm_acc=64.95838 nsp_loss=0.02723 nsp_acc=99.018 throughput=140.0K tks/s lr=0.0000146 time=142.23 INFO:root:[step 854249] mlm_loss=1.42230 mlm_acc=68.26558 nsp_loss=0.02321 nsp_acc=99.210 throughput=132.0K tks/s lr=0.0000146 time=116.55 INFO:root:[step 854499] mlm_loss=1.38067 mlm_acc=68.33533 nsp_loss=0.02779 nsp_acc=99.017 throughput=120.0K tks/s lr=0.0000146 time=119.39 INFO:root:[step 854749] mlm_loss=1.39075 mlm_acc=68.15582 nsp_loss=0.02727 nsp_acc=99.000 throughput=127.0K tks/s lr=0.0000145 time=116.73 INFO:root:[step 854999] mlm_loss=1.05083 mlm_acc=76.58675 nsp_loss=0.03524 nsp_acc=98.889 throughput=132.0K tks/s lr=0.0000145 time=132.87 INFO:root:[step 854999] Saving checkpoints to /home/ubuntu/ckpt-master/0854999.params, /home/ubuntu/ckpt-master/0854999.states. INFO:root:[step 855249] mlm_loss=1.49305 mlm_acc=67.04787 nsp_loss=0.01714 nsp_acc=99.403 throughput=123.0K tks/s lr=0.0000145 time=145.55 INFO:root:[step 855499] mlm_loss=1.44300 mlm_acc=67.41840 nsp_loss=0.01982 nsp_acc=99.315 throughput=134.0K tks/s lr=0.0000145 time=119.96 INFO:root:[step 855749] mlm_loss=1.53023 mlm_acc=67.37869 nsp_loss=0.01707 nsp_acc=99.438 throughput=135.0K tks/s lr=0.0000144 time=131.78 INFO:root:[step 855999] mlm_loss=1.39324 mlm_acc=68.35009 nsp_loss=0.02756 nsp_acc=99.048 throughput=122.0K tks/s lr=0.0000144 time=120.43 INFO:root:[step 856249] mlm_loss=1.59532 mlm_acc=65.49781 nsp_loss=0.02753 nsp_acc=98.997 throughput=140.0K tks/s lr=0.0000144 time=137.89 INFO:root:[step 856499] mlm_loss=1.48201 mlm_acc=67.78675 nsp_loss=0.02061 nsp_acc=99.311 throughput=136.0K tks/s lr=0.0000144 time=120.19 INFO:root:[step 856749] mlm_loss=1.53515 mlm_acc=67.09049 nsp_loss=0.01681 nsp_acc=99.426 throughput=138.0K tks/s lr=0.0000143 time=132.19 INFO:root:[step 856999] mlm_loss=1.42760 mlm_acc=67.91056 nsp_loss=0.02369 nsp_acc=99.171 throughput=121.0K tks/s lr=0.0000143 time=127.03 INFO:root:[step 857249] mlm_loss=1.33176 mlm_acc=69.46671 nsp_loss=0.02577 nsp_acc=99.108 throughput=121.0K tks/s lr=0.0000143 time=108.79 INFO:root:[step 857499] mlm_loss=1.32660 mlm_acc=69.34462 nsp_loss=0.02630 nsp_acc=99.104 throughput=121.0K tks/s lr=0.0000143 time=109.47 INFO:root:[step 857749] mlm_loss=1.62888 mlm_acc=64.87841 nsp_loss=0.02226 nsp_acc=99.238 throughput=142.0K tks/s lr=0.0000142 time=141.13 INFO:root:[step 857999] mlm_loss=1.45468 mlm_acc=67.05164 nsp_loss=0.02353 nsp_acc=99.198 throughput=124.0K tks/s lr=0.0000142 time=125.67 INFO:root:[step 858499] mlm_loss=2.89381 mlm_acc=67.34312 nsp_loss=0.05867 nsp_acc=98.906 throughput=134.0K tks/s lr=0.0000142 time=250.69 INFO:root:[step 858749] mlm_loss=1.47490 mlm_acc=66.11536 nsp_loss=0.03630 nsp_acc=98.601 throughput=142.0K tks/s lr=0.0000141 time=146.07 INFO:root:[step 858999] mlm_loss=1.48099 mlm_acc=65.53369 nsp_loss=0.03054 nsp_acc=98.929 throughput=138.0K tks/s lr=0.0000141 time=138.43 INFO:root:[step 859249] mlm_loss=1.33548 mlm_acc=69.46846 nsp_loss=0.02616 nsp_acc=99.126 throughput=130.0K tks/s lr=0.0000141 time=111.73 INFO:root:[step 859499] mlm_loss=1.49958 mlm_acc=67.74286 nsp_loss=0.02050 nsp_acc=99.317 throughput=129.0K tks/s lr=0.0000141 time=128.65 INFO:root:[step 859749] mlm_loss=1.61073 mlm_acc=65.03104 nsp_loss=0.04207 nsp_acc=98.350 throughput=156.0K tks/s lr=0.0000140 time=158.01 INFO:root:[step 859999] mlm_loss=1.63683 mlm_acc=64.82439 nsp_loss=0.01769 nsp_acc=99.345 throughput=146.0K tks/s lr=0.0000140 time=158.61 INFO:root:[step 859999] Saving checkpoints to /home/ubuntu/ckpt-master/0859999.params, /home/ubuntu/ckpt-master/0859999.states. INFO:root:[step 860249] mlm_loss=1.41155 mlm_acc=67.88195 nsp_loss=0.02287 nsp_acc=99.207 throughput=119.0K tks/s lr=0.0000140 time=138.57 INFO:root:[step 860499] mlm_loss=1.58283 mlm_acc=65.80608 nsp_loss=0.01879 nsp_acc=99.372 throughput=147.0K tks/s lr=0.0000140 time=141.30 INFO:root:[step 860749] mlm_loss=1.46310 mlm_acc=67.49609 nsp_loss=0.01919 nsp_acc=99.350 throughput=131.0K tks/s lr=0.0000139 time=132.22 INFO:root:[step 860999] mlm_loss=1.44934 mlm_acc=68.22629 nsp_loss=0.02036 nsp_acc=99.275 throughput=128.0K tks/s lr=0.0000139 time=125.21 INFO:root:[step 861249] mlm_loss=1.35379 mlm_acc=69.11983 nsp_loss=0.03457 nsp_acc=98.814 throughput=129.0K tks/s lr=0.0000139 time=114.86 INFO:root:[step 861499] mlm_loss=1.67171 mlm_acc=64.40416 nsp_loss=0.03964 nsp_acc=98.510 throughput=138.0K tks/s lr=0.0000139 time=136.93 INFO:root:[step 861749] mlm_loss=1.44074 mlm_acc=68.28847 nsp_loss=0.02353 nsp_acc=99.170 throughput=127.0K tks/s lr=0.0000138 time=128.30 INFO:root:[step 861999] mlm_loss=1.38700 mlm_acc=68.76335 nsp_loss=0.02637 nsp_acc=99.068 throughput=123.0K tks/s lr=0.0000138 time=110.97 INFO:root:[step 862249] mlm_loss=1.25682 mlm_acc=69.96926 nsp_loss=0.03121 nsp_acc=98.937 throughput=122.0K tks/s lr=0.0000138 time=107.67 INFO:root:[step 862499] mlm_loss=1.41571 mlm_acc=68.45447 nsp_loss=0.02303 nsp_acc=99.176 throughput=121.0K tks/s lr=0.0000138 time=121.04 INFO:root:[step 862749] mlm_loss=1.58529 mlm_acc=65.71833 nsp_loss=0.03484 nsp_acc=98.659 throughput=152.0K tks/s lr=0.0000137 time=168.84 INFO:root:[step 862999] mlm_loss=1.44171 mlm_acc=69.00315 nsp_loss=0.02052 nsp_acc=99.306 throughput=146.0K tks/s lr=0.0000137 time=125.99 INFO:root:[step 863249] mlm_loss=1.68175 mlm_acc=63.93743 nsp_loss=0.04184 nsp_acc=98.381 throughput=149.0K tks/s lr=0.0000137 time=166.86 INFO:root:[step 863499] mlm_loss=1.48096 mlm_acc=66.36246 nsp_loss=0.04136 nsp_acc=98.442 throughput=143.0K tks/s lr=0.0000137 time=141.45 INFO:root:[step 863749] mlm_loss=1.66486 mlm_acc=64.82828 nsp_loss=0.03142 nsp_acc=98.782 throughput=162.0K tks/s lr=0.0000136 time=167.92 INFO:root:[step 863999] mlm_loss=1.48813 mlm_acc=66.39577 nsp_loss=0.03265 nsp_acc=98.780 throughput=145.0K tks/s lr=0.0000136 time=145.25 INFO:root:[step 864249] mlm_loss=1.48211 mlm_acc=67.06224 nsp_loss=0.06619 nsp_acc=97.268 throughput=124.0K tks/s lr=0.0000136 time=135.12 INFO:root:[step 864499] mlm_loss=1.48776 mlm_acc=66.72006 nsp_loss=0.02057 nsp_acc=99.299 throughput=140.0K tks/s lr=0.0000136 time=129.49 INFO:root:[step 864749] mlm_loss=1.54745 mlm_acc=65.07181 nsp_loss=0.02466 nsp_acc=99.122 throughput=136.0K tks/s lr=0.0000135 time=134.08 INFO:root:[step 864999] mlm_loss=1.52181 mlm_acc=67.35635 nsp_loss=0.01650 nsp_acc=99.445 throughput=145.0K tks/s lr=0.0000135 time=128.57 INFO:root:[step 864999] Saving checkpoints to /home/ubuntu/ckpt-master/0864999.params, /home/ubuntu/ckpt-master/0864999.states. INFO:root:[step 865249] mlm_loss=1.57152 mlm_acc=66.25444 nsp_loss=0.01430 nsp_acc=99.521 throughput=125.0K tks/s lr=0.0000135 time=165.54 INFO:root:[step 865499] mlm_loss=1.48817 mlm_acc=65.92161 nsp_loss=0.03341 nsp_acc=98.775 throughput=140.0K tks/s lr=0.0000135 time=121.03 INFO:root:[step 865749] mlm_loss=1.44077 mlm_acc=67.62326 nsp_loss=0.02391 nsp_acc=99.213 throughput=128.0K tks/s lr=0.0000134 time=126.93 INFO:root:[step 865999] mlm_loss=1.54708 mlm_acc=66.58584 nsp_loss=0.02541 nsp_acc=99.089 throughput=146.0K tks/s lr=0.0000134 time=144.95 INFO:root:[step 866249] mlm_loss=1.41957 mlm_acc=68.42161 nsp_loss=0.02368 nsp_acc=99.184 throughput=130.0K tks/s lr=0.0000134 time=114.79 INFO:root:[step 866499] mlm_loss=1.30717 mlm_acc=69.71645 nsp_loss=0.02595 nsp_acc=99.133 throughput=111.0K tks/s lr=0.0000134 time=115.52 INFO:root:[step 866749] mlm_loss=1.42830 mlm_acc=68.47495 nsp_loss=0.02237 nsp_acc=99.232 throughput=129.0K tks/s lr=0.0000133 time=115.32 INFO:root:[step 866999] mlm_loss=1.58735 mlm_acc=66.05530 nsp_loss=0.02670 nsp_acc=98.970 throughput=148.0K tks/s lr=0.0000133 time=144.45 INFO:root:[step 867249] mlm_loss=1.56983 mlm_acc=66.93193 nsp_loss=0.01970 nsp_acc=99.332 throughput=140.0K tks/s lr=0.0000133 time=136.76 INFO:root:[step 867499] mlm_loss=1.43233 mlm_acc=68.05755 nsp_loss=0.02441 nsp_acc=99.167 throughput=121.0K tks/s lr=0.0000133 time=124.55 INFO:root:[step 867749] mlm_loss=1.60826 mlm_acc=64.72190 nsp_loss=0.04903 nsp_acc=98.081 throughput=132.0K tks/s lr=0.0000132 time=118.99 INFO:root:[step 867999] mlm_loss=1.53238 mlm_acc=66.76981 nsp_loss=0.02951 nsp_acc=98.910 throughput=130.0K tks/s lr=0.0000132 time=129.48 INFO:root:[step 868249] mlm_loss=1.51226 mlm_acc=66.19095 nsp_loss=0.02778 nsp_acc=98.941 throughput=147.0K tks/s lr=0.0000132 time=143.99 INFO:root:[step 868499] mlm_loss=1.57166 mlm_acc=66.96959 nsp_loss=0.01458 nsp_acc=99.493 throughput=142.0K tks/s lr=0.0000132 time=138.15 INFO:root:[step 868749] mlm_loss=1.37712 mlm_acc=68.50613 nsp_loss=0.02670 nsp_acc=99.058 throughput=128.0K tks/s lr=0.0000131 time=116.27 INFO:root:[step 868999] mlm_loss=1.55337 mlm_acc=66.10863 nsp_loss=0.06434 nsp_acc=97.264 throughput=141.0K tks/s lr=0.0000131 time=141.99 INFO:root:[step 869249] mlm_loss=1.33704 mlm_acc=68.95571 nsp_loss=0.02842 nsp_acc=99.015 throughput=116.0K tks/s lr=0.0000131 time=119.91 INFO:root:[step 869499] mlm_loss=1.33415 mlm_acc=69.15320 nsp_loss=0.02922 nsp_acc=98.989 throughput=123.0K tks/s lr=0.0000131 time=109.30 INFO:root:[step 869749] mlm_loss=1.45425 mlm_acc=68.07638 nsp_loss=0.02056 nsp_acc=99.275 throughput=132.0K tks/s lr=0.0000130 time=126.75 INFO:root:[step 869999] mlm_loss=1.45903 mlm_acc=68.12029 nsp_loss=0.02188 nsp_acc=99.238 throughput=131.0K tks/s lr=0.0000130 time=118.73 INFO:root:[step 869999] Saving checkpoints to /home/ubuntu/ckpt-master/0869999.params, /home/ubuntu/ckpt-master/0869999.states. INFO:root:[step 870249] mlm_loss=1.44583 mlm_acc=68.09653 nsp_loss=0.02190 nsp_acc=99.252 throughput=113.0K tks/s lr=0.0000130 time=137.21 INFO:root:[step 870499] mlm_loss=1.51515 mlm_acc=67.73623 nsp_loss=0.01822 nsp_acc=99.380 throughput=134.0K tks/s lr=0.0000130 time=130.74 INFO:root:[step 870749] mlm_loss=1.42794 mlm_acc=68.38320 nsp_loss=0.02202 nsp_acc=99.239 throughput=132.0K tks/s lr=0.0000129 time=117.16 INFO:root:[step 870999] mlm_loss=1.60172 mlm_acc=65.06964 nsp_loss=0.02016 nsp_acc=99.277 throughput=148.0K tks/s lr=0.0000129 time=147.13 INFO:root:[step 871249] mlm_loss=1.58796 mlm_acc=65.08000 nsp_loss=0.02633 nsp_acc=98.999 throughput=140.0K tks/s lr=0.0000129 time=139.14 INFO:root:[step 871499] mlm_loss=1.50033 mlm_acc=66.27003 nsp_loss=0.04016 nsp_acc=98.431 throughput=136.0K tks/s lr=0.0000129 time=136.98 INFO:root:[step 871749] mlm_loss=1.35439 mlm_acc=69.25996 nsp_loss=0.02893 nsp_acc=99.006 throughput=120.0K tks/s lr=0.0000128 time=106.98 INFO:root:[step 871999] mlm_loss=1.49140 mlm_acc=67.62096 nsp_loss=0.02093 nsp_acc=99.283 throughput=130.0K tks/s lr=0.0000128 time=129.10 INFO:root:[step 872249] mlm_loss=1.42467 mlm_acc=68.52139 nsp_loss=0.02110 nsp_acc=99.248 throughput=126.0K tks/s lr=0.0000128 time=122.66 INFO:root:[step 872499] mlm_loss=1.64996 mlm_acc=65.03076 nsp_loss=0.02041 nsp_acc=99.257 throughput=150.0K tks/s lr=0.0000128 time=147.12 INFO:root:[step 872749] mlm_loss=1.58797 mlm_acc=66.69303 nsp_loss=0.01451 nsp_acc=99.472 throughput=145.0K tks/s lr=0.0000127 time=142.92 INFO:root:[step 872999] mlm_loss=1.49074 mlm_acc=67.93417 nsp_loss=0.01885 nsp_acc=99.360 throughput=134.0K tks/s lr=0.0000127 time=131.19 INFO:root:[step 873249] mlm_loss=1.54011 mlm_acc=67.29080 nsp_loss=0.01496 nsp_acc=99.497 throughput=140.0K tks/s lr=0.0000127 time=135.90 INFO:root:[step 873499] mlm_loss=1.44486 mlm_acc=67.83810 nsp_loss=0.02143 nsp_acc=99.242 throughput=138.0K tks/s lr=0.0000127 time=121.30 INFO:root:[step 873749] mlm_loss=1.56638 mlm_acc=65.11579 nsp_loss=0.03441 nsp_acc=98.731 throughput=134.0K tks/s lr=0.0000126 time=133.79 INFO:root:[step 873999] mlm_loss=1.51243 mlm_acc=67.14177 nsp_loss=0.01841 nsp_acc=99.349 throughput=134.0K tks/s lr=0.0000126 time=133.19 INFO:root:[step 874249] mlm_loss=1.44255 mlm_acc=67.51759 nsp_loss=0.02410 nsp_acc=99.159 throughput=131.0K tks/s lr=0.0000126 time=131.78 INFO:root:[step 874499] mlm_loss=1.35091 mlm_acc=68.04144 nsp_loss=0.03972 nsp_acc=98.500 throughput=128.0K tks/s lr=0.0000126 time=112.35 INFO:root:[step 874749] mlm_loss=1.71823 mlm_acc=63.78559 nsp_loss=0.02829 nsp_acc=98.944 throughput=148.0K tks/s lr=0.0000125 time=167.79 INFO:root:[step 874999] mlm_loss=1.36794 mlm_acc=67.25336 nsp_loss=0.03562 nsp_acc=98.709 throughput=135.0K tks/s lr=0.0000125 time=115.70 INFO:root:[step 874999] Saving checkpoints to /home/ubuntu/ckpt-master/0874999.params, /home/ubuntu/ckpt-master/0874999.states. INFO:root:[step 875249] mlm_loss=1.63807 mlm_acc=65.87457 nsp_loss=0.01795 nsp_acc=99.373 throughput=133.0K tks/s lr=0.0000125 time=161.67 INFO:root:[step 875499] mlm_loss=1.23379 mlm_acc=69.56976 nsp_loss=0.03421 nsp_acc=98.752 throughput=111.0K tks/s lr=0.0000125 time=116.26 INFO:root:[step 875749] mlm_loss=1.42977 mlm_acc=67.71265 nsp_loss=0.02633 nsp_acc=99.053 throughput=133.0K tks/s lr=0.0000124 time=121.16 INFO:root:[step 875999] mlm_loss=1.51744 mlm_acc=67.06638 nsp_loss=0.01855 nsp_acc=99.353 throughput=140.0K tks/s lr=0.0000124 time=133.97 INFO:root:[step 876249] mlm_loss=1.73344 mlm_acc=64.45337 nsp_loss=0.03097 nsp_acc=98.796 throughput=143.0K tks/s lr=0.0000124 time=142.46 INFO:root:[step 876499] mlm_loss=1.41431 mlm_acc=67.72640 nsp_loss=0.03169 nsp_acc=98.858 throughput=117.0K tks/s lr=0.0000124 time=118.93 INFO:root:[step 876749] mlm_loss=1.37089 mlm_acc=68.69956 nsp_loss=0.02494 nsp_acc=99.146 throughput=126.0K tks/s lr=0.0000123 time=113.40 INFO:root:[step 876999] mlm_loss=1.45983 mlm_acc=68.07809 nsp_loss=0.02050 nsp_acc=99.303 throughput=127.0K tks/s lr=0.0000123 time=124.07 INFO:root:[step 877249] mlm_loss=1.57963 mlm_acc=66.72062 nsp_loss=0.01550 nsp_acc=99.451 throughput=145.0K tks/s lr=0.0000123 time=139.81 INFO:root:[step 877499] mlm_loss=1.35022 mlm_acc=68.72839 nsp_loss=0.02602 nsp_acc=99.143 throughput=131.0K tks/s lr=0.0000123 time=116.78 INFO:root:[step 877749] mlm_loss=1.44877 mlm_acc=67.42015 nsp_loss=0.02139 nsp_acc=99.263 throughput=134.0K tks/s lr=0.0000122 time=131.77 INFO:root:[step 878249] mlm_loss=3.09584 mlm_acc=65.48995 nsp_loss=0.06027 nsp_acc=98.880 throughput=149.0K tks/s lr=0.0000122 time=300.78 INFO:root:[step 878499] mlm_loss=1.51134 mlm_acc=66.30961 nsp_loss=0.02666 nsp_acc=99.051 throughput=136.0K tks/s lr=0.0000122 time=132.40 INFO:root:[step 878749] mlm_loss=1.46017 mlm_acc=67.00048 nsp_loss=0.02488 nsp_acc=99.161 throughput=134.0K tks/s lr=0.0000121 time=139.08 INFO:root:[step 878999] mlm_loss=1.31476 mlm_acc=69.58071 nsp_loss=0.02715 nsp_acc=99.068 throughput=120.0K tks/s lr=0.0000121 time=119.54 INFO:root:[step 879249] mlm_loss=1.46690 mlm_acc=67.56844 nsp_loss=0.02068 nsp_acc=99.277 throughput=142.0K tks/s lr=0.0000121 time=121.56 INFO:root:[step 879499] mlm_loss=1.44312 mlm_acc=66.73209 nsp_loss=0.03066 nsp_acc=98.900 throughput=132.0K tks/s lr=0.0000121 time=129.36 INFO:root:[step 879749] mlm_loss=1.71109 mlm_acc=63.91405 nsp_loss=0.03163 nsp_acc=98.803 throughput=154.0K tks/s lr=0.0000120 time=159.49 INFO:root:[step 879999] mlm_loss=1.55442 mlm_acc=67.28542 nsp_loss=0.01714 nsp_acc=99.415 throughput=140.0K tks/s lr=0.0000120 time=137.23 INFO:root:[step 879999] Saving checkpoints to /home/ubuntu/ckpt-master/0879999.params, /home/ubuntu/ckpt-master/0879999.states. INFO:root:[step 880249] mlm_loss=1.53429 mlm_acc=67.30479 nsp_loss=0.01856 nsp_acc=99.359 throughput=120.0K tks/s lr=0.0000120 time=144.72 INFO:root:[step 880499] mlm_loss=1.59418 mlm_acc=66.16503 nsp_loss=0.02560 nsp_acc=99.030 throughput=149.0K tks/s lr=0.0000120 time=147.32 INFO:root:[step 880749] mlm_loss=1.58635 mlm_acc=66.12100 nsp_loss=0.03367 nsp_acc=98.746 throughput=154.0K tks/s lr=0.0000119 time=151.27 INFO:root:[step 880999] mlm_loss=1.37408 mlm_acc=67.85431 nsp_loss=0.02876 nsp_acc=98.961 throughput=123.0K tks/s lr=0.0000119 time=123.67 INFO:root:[step 881249] mlm_loss=1.44627 mlm_acc=67.24610 nsp_loss=0.02678 nsp_acc=99.008 throughput=129.0K tks/s lr=0.0000119 time=130.79 INFO:root:[step 881499] mlm_loss=1.59173 mlm_acc=65.65118 nsp_loss=0.03412 nsp_acc=98.741 throughput=146.0K tks/s lr=0.0000119 time=136.74 INFO:root:[step 881749] mlm_loss=1.41995 mlm_acc=66.55717 nsp_loss=0.02638 nsp_acc=99.044 throughput=142.0K tks/s lr=0.0000118 time=131.88 INFO:root:[step 881999] mlm_loss=1.47329 mlm_acc=66.20656 nsp_loss=0.04906 nsp_acc=98.100 throughput=131.0K tks/s lr=0.0000118 time=135.59 INFO:root:[step 882249] mlm_loss=1.58585 mlm_acc=64.78085 nsp_loss=0.03243 nsp_acc=98.779 throughput=154.0K tks/s lr=0.0000118 time=150.91 INFO:root:[step 882499] mlm_loss=1.47845 mlm_acc=67.33437 nsp_loss=0.02124 nsp_acc=99.257 throughput=129.0K tks/s lr=0.0000118 time=131.19 INFO:root:[step 882749] mlm_loss=1.33104 mlm_acc=69.13616 nsp_loss=0.02615 nsp_acc=99.106 throughput=125.0K tks/s lr=0.0000117 time=108.87 INFO:root:[step 882999] mlm_loss=1.52669 mlm_acc=66.55410 nsp_loss=0.04941 nsp_acc=97.932 throughput=142.0K tks/s lr=0.0000117 time=137.23 INFO:root:[step 883249] mlm_loss=1.66365 mlm_acc=64.89957 nsp_loss=0.04439 nsp_acc=98.280 throughput=143.0K tks/s lr=0.0000117 time=138.33 INFO:root:[step 883499] mlm_loss=1.50644 mlm_acc=67.44761 nsp_loss=0.01859 nsp_acc=99.359 throughput=135.0K tks/s lr=0.0000117 time=131.39 INFO:root:[step 883749] mlm_loss=1.48002 mlm_acc=67.81309 nsp_loss=0.02156 nsp_acc=99.229 throughput=130.0K tks/s lr=0.0000116 time=127.62 INFO:root:[step 883999] mlm_loss=1.44394 mlm_acc=68.12860 nsp_loss=0.02274 nsp_acc=99.206 throughput=130.0K tks/s lr=0.0000116 time=116.08 INFO:root:[step 884249] mlm_loss=1.38873 mlm_acc=68.97251 nsp_loss=0.02626 nsp_acc=99.051 throughput=114.0K tks/s lr=0.0000116 time=119.49 INFO:root:[step 884499] mlm_loss=1.38203 mlm_acc=67.58310 nsp_loss=0.03564 nsp_acc=98.698 throughput=140.0K tks/s lr=0.0000116 time=120.33 INFO:root:[step 884749] mlm_loss=1.54205 mlm_acc=67.06542 nsp_loss=0.02336 nsp_acc=99.182 throughput=136.0K tks/s lr=0.0000115 time=135.68 INFO:root:[step 884999] mlm_loss=1.36065 mlm_acc=68.79266 nsp_loss=0.02637 nsp_acc=99.084 throughput=127.0K tks/s lr=0.0000115 time=111.57 INFO:root:[step 884999] Saving checkpoints to /home/ubuntu/ckpt-master/0884999.params, /home/ubuntu/ckpt-master/0884999.states. INFO:root:[step 885249] mlm_loss=1.59597 mlm_acc=64.79819 nsp_loss=0.02931 nsp_acc=98.927 throughput=137.0K tks/s lr=0.0000115 time=182.79 INFO:root:[step 885499] mlm_loss=1.42009 mlm_acc=68.36597 nsp_loss=0.02404 nsp_acc=99.152 throughput=132.0K tks/s lr=0.0000115 time=116.18 INFO:root:[step 885749] mlm_loss=1.52041 mlm_acc=65.34460 nsp_loss=0.03683 nsp_acc=98.574 throughput=132.0K tks/s lr=0.0000114 time=135.71 INFO:root:[step 885999] mlm_loss=1.46044 mlm_acc=66.09532 nsp_loss=0.03287 nsp_acc=98.815 throughput=134.0K tks/s lr=0.0000114 time=131.95 INFO:root:[step 886249] mlm_loss=1.43303 mlm_acc=68.26975 nsp_loss=0.02492 nsp_acc=99.149 throughput=131.0K tks/s lr=0.0000114 time=112.51 INFO:root:[step 886499] mlm_loss=1.12503 mlm_acc=71.02136 nsp_loss=0.03998 nsp_acc=98.581 throughput=103.0K tks/s lr=0.0000114 time=102.67 INFO:root:[step 886749] mlm_loss=1.40291 mlm_acc=68.28672 nsp_loss=0.02406 nsp_acc=99.163 throughput=125.0K tks/s lr=0.0000113 time=123.94 INFO:root:[step 886999] mlm_loss=1.51560 mlm_acc=67.12532 nsp_loss=0.02002 nsp_acc=99.256 throughput=135.0K tks/s lr=0.0000113 time=134.29 INFO:root:[step 887249] mlm_loss=1.34625 mlm_acc=69.16854 nsp_loss=0.02849 nsp_acc=99.006 throughput=122.0K tks/s lr=0.0000113 time=109.19 INFO:root:[step 887499] mlm_loss=1.28856 mlm_acc=69.25508 nsp_loss=0.03284 nsp_acc=98.848 throughput=118.0K tks/s lr=0.0000113 time=108.69 INFO:root:[step 887749] mlm_loss=1.55103 mlm_acc=67.06453 nsp_loss=0.01796 nsp_acc=99.391 throughput=139.0K tks/s lr=0.0000112 time=145.65 INFO:root:[step 887999] mlm_loss=1.46865 mlm_acc=66.11862 nsp_loss=0.03297 nsp_acc=98.759 throughput=140.0K tks/s lr=0.0000112 time=133.04 INFO:root:[step 888249] mlm_loss=1.54866 mlm_acc=66.39227 nsp_loss=0.03000 nsp_acc=98.890 throughput=142.0K tks/s lr=0.0000112 time=157.03 INFO:root:[step 888499] mlm_loss=1.39499 mlm_acc=68.66525 nsp_loss=0.02638 nsp_acc=99.048 throughput=127.0K tks/s lr=0.0000112 time=116.00 INFO:root:[step 888749] mlm_loss=1.31326 mlm_acc=69.38499 nsp_loss=0.02763 nsp_acc=99.053 throughput=123.0K tks/s lr=0.0000111 time=108.50 INFO:root:[step 888999] mlm_loss=1.52344 mlm_acc=67.21529 nsp_loss=0.03717 nsp_acc=98.538 throughput=140.0K tks/s lr=0.0000111 time=131.90 INFO:root:[step 889249] mlm_loss=1.38620 mlm_acc=68.08458 nsp_loss=0.04118 nsp_acc=98.438 throughput=121.0K tks/s lr=0.0000111 time=123.05 INFO:root:[step 889499] mlm_loss=1.50366 mlm_acc=66.70962 nsp_loss=0.03485 nsp_acc=98.687 throughput=146.0K tks/s lr=0.0000111 time=145.28 INFO:root:[step 889749] mlm_loss=1.30660 mlm_acc=69.05888 nsp_loss=0.02936 nsp_acc=98.967 throughput=120.0K tks/s lr=0.0000110 time=110.62 INFO:root:[step 889999] mlm_loss=1.49674 mlm_acc=66.78679 nsp_loss=0.02176 nsp_acc=99.227 throughput=149.0K tks/s lr=0.0000110 time=143.52 INFO:root:[step 889999] Saving checkpoints to /home/ubuntu/ckpt-master/0889999.params, /home/ubuntu/ckpt-master/0889999.states. INFO:root:[step 890249] mlm_loss=1.48439 mlm_acc=67.47687 nsp_loss=0.03686 nsp_acc=98.598 throughput=122.0K tks/s lr=0.0000110 time=153.56 INFO:root:[step 890499] mlm_loss=1.47916 mlm_acc=67.25077 nsp_loss=0.03352 nsp_acc=98.730 throughput=131.0K tks/s lr=0.0000110 time=131.34 INFO:root:[step 890749] mlm_loss=1.61208 mlm_acc=65.94221 nsp_loss=0.06059 nsp_acc=97.548 throughput=140.0K tks/s lr=0.0000109 time=143.16 INFO:root:[step 890999] mlm_loss=1.46181 mlm_acc=67.78661 nsp_loss=0.02035 nsp_acc=99.279 throughput=140.0K tks/s lr=0.0000109 time=123.20 INFO:root:[step 891249] mlm_loss=1.33015 mlm_acc=69.24973 nsp_loss=0.02774 nsp_acc=99.075 throughput=118.0K tks/s lr=0.0000109 time=121.09 INFO:root:[step 891499] mlm_loss=1.38770 mlm_acc=68.61215 nsp_loss=0.02890 nsp_acc=98.941 throughput=125.0K tks/s lr=0.0000109 time=112.42 INFO:root:[step 891749] mlm_loss=1.18904 mlm_acc=70.36486 nsp_loss=0.04200 nsp_acc=98.507 throughput=115.0K tks/s lr=0.0000108 time=107.55 INFO:root:[step 891999] mlm_loss=1.47692 mlm_acc=67.06469 nsp_loss=0.03275 nsp_acc=98.767 throughput=131.0K tks/s lr=0.0000108 time=129.81 INFO:root:[step 892249] mlm_loss=1.74174 mlm_acc=63.47703 nsp_loss=0.03629 nsp_acc=98.633 throughput=152.0K tks/s lr=0.0000108 time=174.27 INFO:root:[step 892499] mlm_loss=1.36493 mlm_acc=68.81817 nsp_loss=0.02561 nsp_acc=99.130 throughput=126.0K tks/s lr=0.0000108 time=110.50 INFO:root:[step 892749] mlm_loss=1.50656 mlm_acc=67.23173 nsp_loss=0.01943 nsp_acc=99.316 throughput=132.0K tks/s lr=0.0000107 time=133.36 INFO:root:[step 892999] mlm_loss=1.33596 mlm_acc=69.12791 nsp_loss=0.02749 nsp_acc=99.041 throughput=123.0K tks/s lr=0.0000107 time=107.75 INFO:root:[step 893249] mlm_loss=1.31227 mlm_acc=69.33462 nsp_loss=0.03869 nsp_acc=98.559 throughput=109.0K tks/s lr=0.0000107 time=106.23 INFO:root:[step 893499] mlm_loss=1.32941 mlm_acc=68.66724 nsp_loss=0.04070 nsp_acc=98.523 throughput=113.0K tks/s lr=0.0000107 time=114.51 INFO:root:[step 893749] mlm_loss=1.68922 mlm_acc=64.86536 nsp_loss=0.03677 nsp_acc=98.581 throughput=152.0K tks/s lr=0.0000106 time=151.14 INFO:root:[step 893999] mlm_loss=1.90346 mlm_acc=61.70657 nsp_loss=0.05000 nsp_acc=98.078 throughput=137.0K tks/s lr=0.0000106 time=142.28 INFO:root:[step 894249] mlm_loss=1.47228 mlm_acc=67.74900 nsp_loss=0.02121 nsp_acc=99.254 throughput=137.0K tks/s lr=0.0000106 time=120.82 INFO:root:[step 894499] mlm_loss=1.32998 mlm_acc=69.35234 nsp_loss=0.02746 nsp_acc=99.053 throughput=112.0K tks/s lr=0.0000106 time=115.64 INFO:root:[step 894749] mlm_loss=1.41749 mlm_acc=66.98197 nsp_loss=0.02870 nsp_acc=98.988 throughput=144.0K tks/s lr=0.0000105 time=126.57 INFO:root:[step 894999] mlm_loss=1.34244 mlm_acc=68.60799 nsp_loss=0.03011 nsp_acc=98.960 throughput=118.0K tks/s lr=0.0000105 time=119.92 INFO:root:[step 894999] Saving checkpoints to /home/ubuntu/ckpt-master/0894999.params, /home/ubuntu/ckpt-master/0894999.states. INFO:root:[step 895249] mlm_loss=1.34465 mlm_acc=68.92751 nsp_loss=0.02545 nsp_acc=99.126 throughput=109.0K tks/s lr=0.0000105 time=125.98 INFO:root:[step 895499] mlm_loss=1.46062 mlm_acc=67.89915 nsp_loss=0.02322 nsp_acc=99.174 throughput=127.0K tks/s lr=0.0000105 time=124.81 INFO:root:[step 895749] mlm_loss=1.61701 mlm_acc=65.22221 nsp_loss=0.03729 nsp_acc=98.589 throughput=136.0K tks/s lr=0.0000104 time=136.41 INFO:root:[step 895999] mlm_loss=1.33143 mlm_acc=69.33646 nsp_loss=0.02838 nsp_acc=99.017 throughput=122.0K tks/s lr=0.0000104 time=109.49 INFO:root:[step 896249] mlm_loss=1.48739 mlm_acc=66.79201 nsp_loss=0.05594 nsp_acc=97.801 throughput=137.0K tks/s lr=0.0000104 time=134.93 INFO:root:[step 896499] mlm_loss=1.65672 mlm_acc=64.34166 nsp_loss=0.04312 nsp_acc=98.332 throughput=133.0K tks/s lr=0.0000104 time=121.33 INFO:root:[step 896749] mlm_loss=1.51071 mlm_acc=67.65879 nsp_loss=0.01793 nsp_acc=99.379 throughput=141.0K tks/s lr=0.0000103 time=137.24 INFO:root:[step 896999] mlm_loss=1.61806 mlm_acc=65.34188 nsp_loss=0.09126 nsp_acc=96.180 throughput=148.0K tks/s lr=0.0000103 time=151.24 INFO:root:[step 897249] mlm_loss=1.55926 mlm_acc=66.71176 nsp_loss=0.02217 nsp_acc=99.213 throughput=139.0K tks/s lr=0.0000103 time=137.12 INFO:root:[step 897499] mlm_loss=1.50141 mlm_acc=65.89995 nsp_loss=0.04042 nsp_acc=98.482 throughput=137.0K tks/s lr=0.0000103 time=137.20 INFO:root:[step 897749] mlm_loss=1.50459 mlm_acc=67.01201 nsp_loss=0.02336 nsp_acc=99.161 throughput=137.0K tks/s lr=0.0000102 time=132.09 INFO:root:[step 897999] mlm_loss=1.61503 mlm_acc=64.74865 nsp_loss=0.04221 nsp_acc=98.395 throughput=148.0K tks/s lr=0.0000102 time=152.66 INFO:root:[step 898249] mlm_loss=1.45212 mlm_acc=68.04570 nsp_loss=0.02086 nsp_acc=99.273 throughput=134.0K tks/s lr=0.0000102 time=126.77 INFO:root:[step 898499] mlm_loss=1.58074 mlm_acc=65.48894 nsp_loss=0.02025 nsp_acc=99.294 throughput=146.0K tks/s lr=0.0000102 time=149.85 INFO:root:[step 898749] mlm_loss=1.26819 mlm_acc=69.54419 nsp_loss=0.03195 nsp_acc=98.910 throughput=116.0K tks/s lr=0.0000101 time=109.68 INFO:root:[step 898999] mlm_loss=1.39690 mlm_acc=68.47099 nsp_loss=0.02307 nsp_acc=99.215 throughput=123.0K tks/s lr=0.0000101 time=122.96 INFO:root:[step 899249] mlm_loss=1.38435 mlm_acc=67.85486 nsp_loss=0.03847 nsp_acc=98.547 throughput=135.0K tks/s lr=0.0000101 time=113.85 INFO:root:[step 899499] mlm_loss=1.52215 mlm_acc=66.77412 nsp_loss=0.03025 nsp_acc=98.853 throughput=133.0K tks/s lr=0.0000101 time=136.48 INFO:root:[step 899749] mlm_loss=1.35347 mlm_acc=68.99150 nsp_loss=0.02790 nsp_acc=99.023 throughput=124.0K tks/s lr=0.0000100 time=109.22 INFO:root:[step 899999] mlm_loss=1.36615 mlm_acc=68.85261 nsp_loss=0.02742 nsp_acc=99.071 throughput=116.0K tks/s lr=0.0000100 time=119.00 INFO:root:[step 899999] Saving checkpoints to /home/ubuntu/ckpt-master/0899999.params, /home/ubuntu/ckpt-master/0899999.states. INFO:root:[step 900249] mlm_loss=1.42072 mlm_acc=68.41830 nsp_loss=0.02289 nsp_acc=99.185 throughput=118.0K tks/s lr=0.0000100 time=128.46 INFO:root:[step 900499] mlm_loss=1.50252 mlm_acc=66.62085 nsp_loss=0.03342 nsp_acc=98.730 throughput=142.0K tks/s lr=0.0000100 time=141.52 INFO:root:[step 900749] mlm_loss=1.49078 mlm_acc=66.95106 nsp_loss=0.02010 nsp_acc=99.295 throughput=137.0K tks/s lr=0.0000099 time=133.65 INFO:root:[step 900999] mlm_loss=1.40440 mlm_acc=68.49751 nsp_loss=0.02502 nsp_acc=99.083 throughput=128.0K tks/s lr=0.0000099 time=116.45 INFO:root:[step 901249] mlm_loss=1.41696 mlm_acc=68.47663 nsp_loss=0.02335 nsp_acc=99.170 throughput=119.0K tks/s lr=0.0000099 time=120.08 INFO:root:[step 901499] mlm_loss=1.28367 mlm_acc=69.29909 nsp_loss=0.03323 nsp_acc=98.881 throughput=121.0K tks/s lr=0.0000099 time=111.23 INFO:root:[step 901749] mlm_loss=1.57682 mlm_acc=64.00416 nsp_loss=0.05347 nsp_acc=97.955 throughput=147.0K tks/s lr=0.0000098 time=143.45 INFO:root:[step 901999] mlm_loss=1.64157 mlm_acc=65.57703 nsp_loss=0.08911 nsp_acc=96.281 throughput=137.0K tks/s lr=0.0000098 time=138.04 INFO:root:[step 902249] mlm_loss=1.66865 mlm_acc=64.63226 nsp_loss=0.04170 nsp_acc=98.396 throughput=156.0K tks/s lr=0.0000098 time=157.66 INFO:root:[step 902499] mlm_loss=1.39317 mlm_acc=67.94477 nsp_loss=0.02472 nsp_acc=99.152 throughput=120.0K tks/s lr=0.0000098 time=124.85 INFO:root:[step 902749] mlm_loss=1.38078 mlm_acc=68.76490 nsp_loss=0.02681 nsp_acc=99.077 throughput=127.0K tks/s lr=0.0000097 time=110.63 INFO:root:[step 902999] mlm_loss=1.42733 mlm_acc=68.18075 nsp_loss=0.02444 nsp_acc=99.126 throughput=122.0K tks/s lr=0.0000097 time=119.05 INFO:root:[step 903249] mlm_loss=1.43292 mlm_acc=68.16952 nsp_loss=0.02122 nsp_acc=99.244 throughput=134.0K tks/s lr=0.0000097 time=119.74 INFO:root:[step 903499] mlm_loss=1.73920 mlm_acc=62.89386 nsp_loss=0.05033 nsp_acc=97.984 throughput=149.0K tks/s lr=0.0000097 time=149.73 INFO:root:[step 903749] mlm_loss=1.53506 mlm_acc=65.44619 nsp_loss=0.03049 nsp_acc=98.883 throughput=139.0K tks/s lr=0.0000096 time=141.28 INFO:root:[step 903999] mlm_loss=1.33294 mlm_acc=69.21631 nsp_loss=0.02527 nsp_acc=99.142 throughput=118.0K tks/s lr=0.0000096 time=119.19 INFO:root:[step 904249] mlm_loss=1.60753 mlm_acc=65.58667 nsp_loss=0.02443 nsp_acc=99.087 throughput=150.0K tks/s lr=0.0000096 time=147.39 INFO:root:[step 904499] mlm_loss=1.66737 mlm_acc=64.92813 nsp_loss=0.03389 nsp_acc=98.659 throughput=157.0K tks/s lr=0.0000096 time=157.44 INFO:root:[step 904749] mlm_loss=1.55288 mlm_acc=65.61472 nsp_loss=0.03766 nsp_acc=98.547 throughput=142.0K tks/s lr=0.0000095 time=139.88 INFO:root:[step 904999] mlm_loss=1.50518 mlm_acc=67.89476 nsp_loss=0.01896 nsp_acc=99.331 throughput=136.0K tks/s lr=0.0000095 time=131.10 INFO:root:[step 904999] Saving checkpoints to /home/ubuntu/ckpt-master/0904999.params, /home/ubuntu/ckpt-master/0904999.states. INFO:root:[step 905249] mlm_loss=1.52974 mlm_acc=66.48128 nsp_loss=0.02889 nsp_acc=98.932 throughput=134.0K tks/s lr=0.0000095 time=160.69 INFO:root:[step 905499] mlm_loss=1.49489 mlm_acc=67.76468 nsp_loss=0.02017 nsp_acc=99.289 throughput=133.0K tks/s lr=0.0000095 time=129.40 INFO:root:[step 905749] mlm_loss=1.23359 mlm_acc=70.10552 nsp_loss=0.03586 nsp_acc=98.718 throughput=110.0K tks/s lr=0.0000094 time=107.29 INFO:root:[step 905999] mlm_loss=1.04206 mlm_acc=75.63034 nsp_loss=0.03998 nsp_acc=98.682 throughput=128.0K tks/s lr=0.0000094 time=127.90 INFO:root:[step 906249] mlm_loss=1.67090 mlm_acc=64.63712 nsp_loss=0.02408 nsp_acc=99.071 throughput=155.0K tks/s lr=0.0000094 time=156.21 INFO:root:[step 906499] mlm_loss=1.52829 mlm_acc=66.37396 nsp_loss=0.02220 nsp_acc=99.213 throughput=140.0K tks/s lr=0.0000094 time=135.53 INFO:root:[step 906749] mlm_loss=1.52486 mlm_acc=66.22329 nsp_loss=0.02660 nsp_acc=99.059 throughput=146.0K tks/s lr=0.0000093 time=151.11 INFO:root:[step 906999] mlm_loss=1.30173 mlm_acc=69.67542 nsp_loss=0.02937 nsp_acc=98.996 throughput=116.0K tks/s lr=0.0000093 time=108.59 INFO:root:[step 907249] mlm_loss=1.41456 mlm_acc=68.36435 nsp_loss=0.02390 nsp_acc=99.192 throughput=123.0K tks/s lr=0.0000093 time=120.48 INFO:root:[step 907499] mlm_loss=1.43006 mlm_acc=68.14935 nsp_loss=0.02059 nsp_acc=99.258 throughput=135.0K tks/s lr=0.0000093 time=119.28 INFO:root:[step 907749] mlm_loss=1.49639 mlm_acc=67.79173 nsp_loss=0.01924 nsp_acc=99.337 throughput=134.0K tks/s lr=0.0000092 time=131.54 INFO:root:[step 907999] mlm_loss=1.55377 mlm_acc=66.87928 nsp_loss=0.01737 nsp_acc=99.398 throughput=141.0K tks/s lr=0.0000092 time=135.26 INFO:root:[step 908249] mlm_loss=1.51153 mlm_acc=67.77997 nsp_loss=0.01717 nsp_acc=99.432 throughput=140.0K tks/s lr=0.0000092 time=137.91 INFO:root:[step 908499] mlm_loss=1.60672 mlm_acc=66.18576 nsp_loss=0.02713 nsp_acc=98.974 throughput=148.0K tks/s lr=0.0000092 time=144.70 INFO:root:[step 908749] mlm_loss=1.50969 mlm_acc=67.02423 nsp_loss=0.02500 nsp_acc=99.148 throughput=132.0K tks/s lr=0.0000091 time=130.09 INFO:root:[step 908999] mlm_loss=1.42965 mlm_acc=68.30883 nsp_loss=0.02070 nsp_acc=99.292 throughput=126.0K tks/s lr=0.0000091 time=127.38 INFO:root:[step 909249] mlm_loss=1.56423 mlm_acc=64.91140 nsp_loss=0.02546 nsp_acc=99.100 throughput=147.0K tks/s lr=0.0000091 time=128.55 INFO:root:[step 909499] mlm_loss=1.57036 mlm_acc=65.76987 nsp_loss=0.03362 nsp_acc=98.740 throughput=140.0K tks/s lr=0.0000091 time=138.75 INFO:root:[step 909749] mlm_loss=1.43093 mlm_acc=67.26219 nsp_loss=0.03270 nsp_acc=98.762 throughput=129.0K tks/s lr=0.0000090 time=131.69 INFO:root:[step 909999] mlm_loss=1.46550 mlm_acc=66.02406 nsp_loss=0.04865 nsp_acc=98.116 throughput=133.0K tks/s lr=0.0000090 time=135.37 INFO:root:[step 909999] Saving checkpoints to /home/ubuntu/ckpt-master/0909999.params, /home/ubuntu/ckpt-master/0909999.states. INFO:root:[step 910249] mlm_loss=1.26988 mlm_acc=70.31031 nsp_loss=0.03276 nsp_acc=98.867 throughput=107.0K tks/s lr=0.0000090 time=122.87 INFO:root:[step 910499] mlm_loss=1.49199 mlm_acc=66.49296 nsp_loss=0.05755 nsp_acc=97.816 throughput=137.0K tks/s lr=0.0000090 time=134.18 INFO:root:[step 910749] mlm_loss=1.53168 mlm_acc=67.47343 nsp_loss=0.01980 nsp_acc=99.317 throughput=132.0K tks/s lr=0.0000089 time=132.17 INFO:root:[step 910999] mlm_loss=1.50398 mlm_acc=67.30409 nsp_loss=0.05057 nsp_acc=98.023 throughput=145.0K tks/s lr=0.0000089 time=128.77 INFO:root:[step 911249] mlm_loss=1.46309 mlm_acc=68.14549 nsp_loss=0.02198 nsp_acc=99.262 throughput=128.0K tks/s lr=0.0000089 time=125.12 INFO:root:[step 911499] mlm_loss=1.38896 mlm_acc=68.90130 nsp_loss=0.02568 nsp_acc=99.088 throughput=123.0K tks/s lr=0.0000089 time=109.39 INFO:root:[step 911749] mlm_loss=1.48141 mlm_acc=67.27505 nsp_loss=0.03541 nsp_acc=98.704 throughput=138.0K tks/s lr=0.0000088 time=134.13 INFO:root:[step 911999] mlm_loss=1.34120 mlm_acc=68.27011 nsp_loss=0.03548 nsp_acc=98.755 throughput=127.0K tks/s lr=0.0000088 time=126.34 INFO:root:[step 912249] mlm_loss=1.63750 mlm_acc=65.49599 nsp_loss=0.02968 nsp_acc=98.882 throughput=153.0K tks/s lr=0.0000088 time=150.75 INFO:root:[step 912499] mlm_loss=1.54269 mlm_acc=66.71522 nsp_loss=0.03177 nsp_acc=98.789 throughput=150.0K tks/s lr=0.0000088 time=144.28 INFO:root:[step 912749] mlm_loss=1.62671 mlm_acc=65.30466 nsp_loss=0.03826 nsp_acc=98.536 throughput=148.0K tks/s lr=0.0000087 time=162.97 INFO:root:[step 912999] mlm_loss=1.47498 mlm_acc=67.88627 nsp_loss=0.02483 nsp_acc=99.102 throughput=137.0K tks/s lr=0.0000087 time=116.87 INFO:root:[step 913249] mlm_loss=1.49828 mlm_acc=66.56779 nsp_loss=0.06355 nsp_acc=97.356 throughput=138.0K tks/s lr=0.0000087 time=139.17 INFO:root:[step 913499] mlm_loss=1.42196 mlm_acc=67.87351 nsp_loss=0.02398 nsp_acc=99.191 throughput=129.0K tks/s lr=0.0000087 time=130.39 INFO:root:[step 913749] mlm_loss=1.36435 mlm_acc=69.02837 nsp_loss=0.02752 nsp_acc=99.018 throughput=123.0K tks/s lr=0.0000086 time=109.92 INFO:root:[step 913999] mlm_loss=1.54223 mlm_acc=66.93778 nsp_loss=0.01892 nsp_acc=99.346 throughput=140.0K tks/s lr=0.0000086 time=136.40 INFO:root:[step 914249] mlm_loss=1.41533 mlm_acc=68.22423 nsp_loss=0.02405 nsp_acc=99.157 throughput=132.0K tks/s lr=0.0000086 time=127.83 INFO:root:[step 914499] mlm_loss=1.33722 mlm_acc=68.06993 nsp_loss=0.03131 nsp_acc=98.929 throughput=130.0K tks/s lr=0.0000086 time=120.75 INFO:root:[step 914749] mlm_loss=1.56412 mlm_acc=65.27406 nsp_loss=0.04430 nsp_acc=98.272 throughput=130.0K tks/s lr=0.0000085 time=130.92 INFO:root:[step 914999] mlm_loss=1.27962 mlm_acc=70.02439 nsp_loss=0.02949 nsp_acc=98.961 throughput=117.0K tks/s lr=0.0000085 time=105.60 INFO:root:[step 914999] Saving checkpoints to /home/ubuntu/ckpt-master/0914999.params, /home/ubuntu/ckpt-master/0914999.states. INFO:root:[step 915249] mlm_loss=1.33002 mlm_acc=69.62153 nsp_loss=0.02625 nsp_acc=99.058 throughput=102.0K tks/s lr=0.0000085 time=131.83 INFO:root:[step 915499] mlm_loss=1.46646 mlm_acc=66.04438 nsp_loss=0.02636 nsp_acc=99.082 throughput=142.0K tks/s lr=0.0000085 time=121.28 INFO:root:[step 915749] mlm_loss=1.47336 mlm_acc=66.91687 nsp_loss=0.02232 nsp_acc=99.242 throughput=132.0K tks/s lr=0.0000084 time=132.40 INFO:root:[step 915999] mlm_loss=1.34186 mlm_acc=69.08883 nsp_loss=0.02622 nsp_acc=99.105 throughput=122.0K tks/s lr=0.0000084 time=110.03 INFO:root:[step 916249] mlm_loss=1.37985 mlm_acc=68.59006 nsp_loss=0.02873 nsp_acc=98.970 throughput=116.0K tks/s lr=0.0000084 time=119.70 INFO:root:[step 916499] mlm_loss=1.58257 mlm_acc=65.51555 nsp_loss=0.04189 nsp_acc=98.399 throughput=138.0K tks/s lr=0.0000084 time=142.39 INFO:root:[step 916749] mlm_loss=1.26595 mlm_acc=69.73488 nsp_loss=0.03185 nsp_acc=98.901 throughput=118.0K tks/s lr=0.0000083 time=107.00 INFO:root:[step 916999] mlm_loss=1.47561 mlm_acc=66.51408 nsp_loss=0.06213 nsp_acc=97.533 throughput=142.0K tks/s lr=0.0000083 time=137.75 INFO:root:[step 917249] mlm_loss=1.78721 mlm_acc=63.12830 nsp_loss=0.05230 nsp_acc=97.893 throughput=145.0K tks/s lr=0.0000083 time=147.59 INFO:root:[step 917499] mlm_loss=1.52291 mlm_acc=67.51845 nsp_loss=0.01878 nsp_acc=99.363 throughput=134.0K tks/s lr=0.0000083 time=133.75 INFO:root:[step 917749] mlm_loss=1.34357 mlm_acc=69.30359 nsp_loss=0.02630 nsp_acc=99.091 throughput=120.0K tks/s lr=0.0000082 time=110.18 INFO:root:[step 917999] mlm_loss=1.44532 mlm_acc=67.35068 nsp_loss=0.02450 nsp_acc=99.138 throughput=132.0K tks/s lr=0.0000082 time=130.13 INFO:root:[step 918249] mlm_loss=1.33258 mlm_acc=69.33127 nsp_loss=0.03180 nsp_acc=98.865 throughput=123.0K tks/s lr=0.0000082 time=109.34 INFO:root:[step 918499] mlm_loss=1.59036 mlm_acc=64.91792 nsp_loss=0.03062 nsp_acc=98.865 throughput=153.0K tks/s lr=0.0000082 time=167.10 INFO:root:[step 918749] mlm_loss=1.57119 mlm_acc=67.15291 nsp_loss=0.01423 nsp_acc=99.509 throughput=148.0K tks/s lr=0.0000081 time=129.48 INFO:root:[step 918999] mlm_loss=1.66499 mlm_acc=64.82931 nsp_loss=0.03141 nsp_acc=98.841 throughput=159.0K tks/s lr=0.0000081 time=174.27 INFO:root:[step 919249] mlm_loss=1.54983 mlm_acc=65.85896 nsp_loss=0.02171 nsp_acc=99.246 throughput=142.0K tks/s lr=0.0000081 time=137.37 INFO:root:[step 919499] mlm_loss=1.51318 mlm_acc=66.15103 nsp_loss=0.01802 nsp_acc=99.386 throughput=136.0K tks/s lr=0.0000081 time=140.09 INFO:root:[step 919749] mlm_loss=1.34000 mlm_acc=69.14640 nsp_loss=0.02471 nsp_acc=99.137 throughput=128.0K tks/s lr=0.0000080 time=113.00 INFO:root:[step 919999] mlm_loss=1.47259 mlm_acc=68.22997 nsp_loss=0.01608 nsp_acc=99.470 throughput=132.0K tks/s lr=0.0000080 time=127.22 INFO:root:[step 919999] Saving checkpoints to /home/ubuntu/ckpt-master/0919999.params, /home/ubuntu/ckpt-master/0919999.states. INFO:root:[step 920249] mlm_loss=1.50776 mlm_acc=67.62756 nsp_loss=0.01456 nsp_acc=99.517 throughput=126.0K tks/s lr=0.0000080 time=150.67 INFO:root:[step 920499] mlm_loss=1.32684 mlm_acc=69.48344 nsp_loss=0.02399 nsp_acc=99.170 throughput=125.0K tks/s lr=0.0000080 time=110.50 INFO:root:[step 920749] mlm_loss=1.46246 mlm_acc=68.05171 nsp_loss=0.01850 nsp_acc=99.383 throughput=127.0K tks/s lr=0.0000079 time=123.84 INFO:root:[step 920999] mlm_loss=1.37243 mlm_acc=68.80527 nsp_loss=0.01837 nsp_acc=99.384 throughput=130.0K tks/s lr=0.0000079 time=116.34 INFO:root:[step 921249] mlm_loss=1.37468 mlm_acc=68.28183 nsp_loss=0.02034 nsp_acc=99.289 throughput=125.0K tks/s lr=0.0000079 time=119.80 INFO:root:[step 921499] mlm_loss=1.50698 mlm_acc=67.35307 nsp_loss=0.01434 nsp_acc=99.511 throughput=137.0K tks/s lr=0.0000079 time=132.71 INFO:root:[step 921749] mlm_loss=1.57791 mlm_acc=66.65063 nsp_loss=0.02527 nsp_acc=99.019 throughput=144.0K tks/s lr=0.0000078 time=144.84 INFO:root:[step 921999] mlm_loss=1.47608 mlm_acc=67.01967 nsp_loss=0.05533 nsp_acc=97.776 throughput=140.0K tks/s lr=0.0000078 time=144.32 INFO:root:[step 922249] mlm_loss=1.29253 mlm_acc=69.67071 nsp_loss=0.02705 nsp_acc=99.051 throughput=122.0K tks/s lr=0.0000078 time=109.14 INFO:root:[step 922499] mlm_loss=1.43531 mlm_acc=67.87705 nsp_loss=0.01976 nsp_acc=99.310 throughput=132.0K tks/s lr=0.0000078 time=131.29 INFO:root:[step 922749] mlm_loss=1.63537 mlm_acc=63.72166 nsp_loss=0.02439 nsp_acc=99.133 throughput=144.0K tks/s lr=0.0000077 time=144.02 INFO:root:[step 922999] mlm_loss=1.72782 mlm_acc=63.87306 nsp_loss=0.01786 nsp_acc=99.336 throughput=155.0K tks/s lr=0.0000077 time=156.28 INFO:root:[step 923249] mlm_loss=1.60533 mlm_acc=65.60688 nsp_loss=0.01534 nsp_acc=99.448 throughput=139.0K tks/s lr=0.0000077 time=155.19 INFO:root:[step 923499] mlm_loss=1.26980 mlm_acc=69.94165 nsp_loss=0.02657 nsp_acc=99.080 throughput=117.0K tks/s lr=0.0000077 time=105.93 INFO:root:[step 923749] mlm_loss=1.49395 mlm_acc=65.55857 nsp_loss=0.03935 nsp_acc=98.507 throughput=142.0K tks/s lr=0.0000076 time=126.44 INFO:root:[step 923999] mlm_loss=1.53330 mlm_acc=67.10329 nsp_loss=0.01397 nsp_acc=99.519 throughput=142.0K tks/s lr=0.0000076 time=137.80 INFO:root:[step 924249] mlm_loss=1.31093 mlm_acc=69.48888 nsp_loss=0.02913 nsp_acc=98.967 throughput=116.0K tks/s lr=0.0000076 time=119.66 INFO:root:[step 924499] mlm_loss=1.34441 mlm_acc=69.03884 nsp_loss=0.02466 nsp_acc=99.181 throughput=133.0K tks/s lr=0.0000076 time=114.02 INFO:root:[step 924749] mlm_loss=1.35019 mlm_acc=68.72833 nsp_loss=0.02814 nsp_acc=98.984 throughput=113.0K tks/s lr=0.0000075 time=120.37 INFO:root:[step 924999] mlm_loss=1.47172 mlm_acc=67.95343 nsp_loss=0.01762 nsp_acc=99.383 throughput=139.0K tks/s lr=0.0000075 time=119.32 INFO:root:[step 924999] Saving checkpoints to /home/ubuntu/ckpt-master/0924999.params, /home/ubuntu/ckpt-master/0924999.states. INFO:root:[step 925249] mlm_loss=1.50473 mlm_acc=67.30456 nsp_loss=0.02027 nsp_acc=99.289 throughput=132.0K tks/s lr=0.0000075 time=175.43 INFO:root:[step 925499] mlm_loss=1.64093 mlm_acc=64.92193 nsp_loss=0.03726 nsp_acc=98.528 throughput=160.0K tks/s lr=0.0000075 time=163.96 INFO:root:[step 925749] mlm_loss=1.60439 mlm_acc=65.39995 nsp_loss=0.02857 nsp_acc=98.947 throughput=149.0K tks/s lr=0.0000074 time=150.88 INFO:root:[step 925999] mlm_loss=1.45425 mlm_acc=68.09518 nsp_loss=0.01898 nsp_acc=99.345 throughput=128.0K tks/s lr=0.0000074 time=127.06 INFO:root:[step 926249] mlm_loss=1.63111 mlm_acc=64.99511 nsp_loss=0.01792 nsp_acc=99.410 throughput=147.0K tks/s lr=0.0000074 time=144.18 INFO:root:[step 926749] mlm_loss=3.25559 mlm_acc=65.28050 nsp_loss=0.02435 nsp_acc=99.570 throughput=152.0K tks/s lr=0.0000073 time=319.54 INFO:root:[step 926999] mlm_loss=1.59017 mlm_acc=66.10603 nsp_loss=0.01862 nsp_acc=99.306 throughput=147.0K tks/s lr=0.0000073 time=163.84 INFO:root:[step 927249] mlm_loss=1.30678 mlm_acc=69.44358 nsp_loss=0.02906 nsp_acc=98.986 throughput=118.0K tks/s lr=0.0000073 time=108.98 INFO:root:[step 927499] mlm_loss=1.40435 mlm_acc=68.40507 nsp_loss=0.01820 nsp_acc=99.383 throughput=137.0K tks/s lr=0.0000073 time=117.90 INFO:root:[step 927749] mlm_loss=1.43503 mlm_acc=66.97463 nsp_loss=0.03663 nsp_acc=98.655 throughput=136.0K tks/s lr=0.0000072 time=137.45 INFO:root:[step 927999] mlm_loss=1.33291 mlm_acc=69.58856 nsp_loss=0.02550 nsp_acc=99.117 throughput=117.0K tks/s lr=0.0000072 time=117.61 INFO:root:[step 928249] mlm_loss=1.45336 mlm_acc=67.88636 nsp_loss=0.01949 nsp_acc=99.335 throughput=137.0K tks/s lr=0.0000072 time=121.91 INFO:root:[step 928499] mlm_loss=1.41132 mlm_acc=68.60455 nsp_loss=0.01940 nsp_acc=99.354 throughput=127.0K tks/s lr=0.0000072 time=123.71 INFO:root:[step 928749] mlm_loss=1.51168 mlm_acc=67.67741 nsp_loss=0.01575 nsp_acc=99.472 throughput=135.0K tks/s lr=0.0000071 time=133.32 INFO:root:[step 928999] mlm_loss=1.45504 mlm_acc=68.32079 nsp_loss=0.01718 nsp_acc=99.436 throughput=135.0K tks/s lr=0.0000071 time=119.83 INFO:root:[step 929249] mlm_loss=1.43356 mlm_acc=67.33557 nsp_loss=0.04131 nsp_acc=98.376 throughput=133.0K tks/s lr=0.0000071 time=135.49 INFO:root:[step 929499] mlm_loss=1.36430 mlm_acc=68.95057 nsp_loss=0.02162 nsp_acc=99.272 throughput=129.0K tks/s lr=0.0000071 time=113.03 INFO:root:[step 929749] mlm_loss=1.45993 mlm_acc=68.06079 nsp_loss=0.01906 nsp_acc=99.342 throughput=128.0K tks/s lr=0.0000070 time=127.44 INFO:root:[step 929999] mlm_loss=1.54810 mlm_acc=66.88271 nsp_loss=0.01525 nsp_acc=99.491 throughput=142.0K tks/s lr=0.0000070 time=136.75 INFO:root:[step 929999] Saving checkpoints to /home/ubuntu/ckpt-master/0929999.params, /home/ubuntu/ckpt-master/0929999.states. INFO:root:[step 930249] mlm_loss=1.49193 mlm_acc=67.70422 nsp_loss=0.01597 nsp_acc=99.429 throughput=121.0K tks/s lr=0.0000070 time=150.25 INFO:root:[step 930499] mlm_loss=1.29107 mlm_acc=69.81255 nsp_loss=0.02762 nsp_acc=99.054 throughput=117.0K tks/s lr=0.0000070 time=106.77 INFO:root:[step 930749] mlm_loss=1.42213 mlm_acc=67.43635 nsp_loss=0.07469 nsp_acc=96.951 throughput=127.0K tks/s lr=0.0000069 time=133.30 INFO:root:[step 930999] mlm_loss=1.35559 mlm_acc=69.12334 nsp_loss=0.02438 nsp_acc=99.175 throughput=125.0K tks/s lr=0.0000069 time=110.85 INFO:root:[step 931249] mlm_loss=1.36434 mlm_acc=68.89988 nsp_loss=0.02264 nsp_acc=99.217 throughput=118.0K tks/s lr=0.0000069 time=119.90 INFO:root:[step 931499] mlm_loss=1.36637 mlm_acc=67.61724 nsp_loss=0.02684 nsp_acc=99.039 throughput=140.0K tks/s lr=0.0000069 time=122.09 INFO:root:[step 931749] mlm_loss=1.26391 mlm_acc=68.44002 nsp_loss=0.04475 nsp_acc=98.322 throughput=113.0K tks/s lr=0.0000068 time=120.97 INFO:root:[step 931999] mlm_loss=1.55909 mlm_acc=65.30332 nsp_loss=0.01914 nsp_acc=99.352 throughput=140.0K tks/s lr=0.0000068 time=142.70 INFO:root:[step 932249] mlm_loss=1.35471 mlm_acc=68.54928 nsp_loss=0.02443 nsp_acc=99.154 throughput=133.0K tks/s lr=0.0000068 time=113.04 INFO:root:[step 932499] mlm_loss=1.53133 mlm_acc=66.20990 nsp_loss=0.04281 nsp_acc=98.296 throughput=141.0K tks/s lr=0.0000068 time=141.30 INFO:root:[step 932749] mlm_loss=1.58034 mlm_acc=65.28571 nsp_loss=0.02544 nsp_acc=99.074 throughput=138.0K tks/s lr=0.0000067 time=139.41 INFO:root:[step 932999] mlm_loss=1.49334 mlm_acc=67.55659 nsp_loss=0.02087 nsp_acc=99.233 throughput=135.0K tks/s lr=0.0000067 time=128.62 INFO:root:[step 933249] mlm_loss=1.59531 mlm_acc=65.70986 nsp_loss=0.03081 nsp_acc=98.824 throughput=143.0K tks/s lr=0.0000067 time=144.72 INFO:root:[step 933499] mlm_loss=1.61333 mlm_acc=65.60222 nsp_loss=0.02478 nsp_acc=99.122 throughput=145.0K tks/s lr=0.0000067 time=147.32 INFO:root:[step 933749] mlm_loss=1.41786 mlm_acc=68.42277 nsp_loss=0.02015 nsp_acc=99.323 throughput=131.0K tks/s lr=0.0000066 time=119.40 INFO:root:[step 933999] mlm_loss=1.53817 mlm_acc=64.88350 nsp_loss=0.03462 nsp_acc=98.745 throughput=133.0K tks/s lr=0.0000066 time=134.58 INFO:root:[step 934249] mlm_loss=1.46894 mlm_acc=66.30825 nsp_loss=0.03802 nsp_acc=98.582 throughput=139.0K tks/s lr=0.0000066 time=136.22 INFO:root:[step 934499] mlm_loss=1.62285 mlm_acc=64.52837 nsp_loss=0.01714 nsp_acc=99.404 throughput=150.0K tks/s lr=0.0000066 time=144.97 INFO:root:[step 934749] mlm_loss=1.60194 mlm_acc=65.78288 nsp_loss=0.01825 nsp_acc=99.352 throughput=150.0K tks/s lr=0.0000065 time=150.40 INFO:root:[step 934999] mlm_loss=1.44764 mlm_acc=66.99287 nsp_loss=0.02868 nsp_acc=98.926 throughput=143.0K tks/s lr=0.0000065 time=142.87 INFO:root:[step 934999] Saving checkpoints to /home/ubuntu/ckpt-master/0934999.params, /home/ubuntu/ckpt-master/0934999.states. INFO:root:[step 935249] mlm_loss=1.45231 mlm_acc=68.17797 nsp_loss=0.01784 nsp_acc=99.396 throughput=119.0K tks/s lr=0.0000065 time=144.44 INFO:root:[step 935499] mlm_loss=1.44607 mlm_acc=68.04350 nsp_loss=0.02192 nsp_acc=99.233 throughput=123.0K tks/s lr=0.0000065 time=127.33 INFO:root:[step 935749] mlm_loss=1.36656 mlm_acc=69.00554 nsp_loss=0.02082 nsp_acc=99.275 throughput=131.0K tks/s lr=0.0000064 time=113.13 INFO:root:[step 935999] mlm_loss=1.54504 mlm_acc=66.95995 nsp_loss=0.01752 nsp_acc=99.399 throughput=148.0K tks/s lr=0.0000064 time=145.15 INFO:root:[step 936249] mlm_loss=1.62527 mlm_acc=65.41474 nsp_loss=0.04590 nsp_acc=98.111 throughput=152.0K tks/s lr=0.0000064 time=153.82 INFO:root:[step 936499] mlm_loss=1.44976 mlm_acc=67.79073 nsp_loss=0.02186 nsp_acc=99.232 throughput=131.0K tks/s lr=0.0000064 time=131.58 INFO:root:[step 936749] mlm_loss=1.50031 mlm_acc=67.57373 nsp_loss=0.01498 nsp_acc=99.467 throughput=138.0K tks/s lr=0.0000063 time=131.76 INFO:root:[step 936999] mlm_loss=1.52977 mlm_acc=66.99648 nsp_loss=0.02000 nsp_acc=99.280 throughput=140.0K tks/s lr=0.0000063 time=135.65 INFO:root:[step 937249] mlm_loss=1.44977 mlm_acc=67.38366 nsp_loss=0.02548 nsp_acc=99.086 throughput=131.0K tks/s lr=0.0000063 time=133.34 INFO:root:[step 937499] mlm_loss=1.36453 mlm_acc=69.08557 nsp_loss=0.02340 nsp_acc=99.196 throughput=131.0K tks/s lr=0.0000063 time=114.02 INFO:root:[step 937749] mlm_loss=1.51781 mlm_acc=67.00720 nsp_loss=0.01476 nsp_acc=99.477 throughput=144.0K tks/s lr=0.0000062 time=136.65 INFO:root:[step 937999] mlm_loss=1.52475 mlm_acc=67.27606 nsp_loss=0.01542 nsp_acc=99.500 throughput=139.0K tks/s lr=0.0000062 time=137.40 INFO:root:[step 938249] mlm_loss=1.31866 mlm_acc=68.98541 nsp_loss=0.03640 nsp_acc=98.662 throughput=115.0K tks/s lr=0.0000062 time=108.58 INFO:root:[step 938499] mlm_loss=1.30234 mlm_acc=69.63952 nsp_loss=0.02867 nsp_acc=98.979 throughput=109.0K tks/s lr=0.0000062 time=115.72 INFO:root:[step 938749] mlm_loss=1.47789 mlm_acc=67.02608 nsp_loss=0.01749 nsp_acc=99.405 throughput=142.0K tks/s lr=0.0000061 time=127.74 INFO:root:[step 938999] mlm_loss=1.42444 mlm_acc=68.05544 nsp_loss=0.01997 nsp_acc=99.296 throughput=131.0K tks/s lr=0.0000061 time=130.96 INFO:root:[step 939249] mlm_loss=1.44477 mlm_acc=67.90435 nsp_loss=0.02081 nsp_acc=99.263 throughput=128.0K tks/s lr=0.0000061 time=129.50 INFO:root:[step 939499] mlm_loss=1.36227 mlm_acc=68.82495 nsp_loss=0.02526 nsp_acc=99.145 throughput=126.0K tks/s lr=0.0000061 time=113.32 INFO:root:[step 939749] mlm_loss=1.56806 mlm_acc=66.87074 nsp_loss=0.01205 nsp_acc=99.579 throughput=144.0K tks/s lr=0.0000060 time=142.70 INFO:root:[step 939999] mlm_loss=1.49519 mlm_acc=66.95062 nsp_loss=0.02538 nsp_acc=99.048 throughput=141.0K tks/s lr=0.0000060 time=138.70 INFO:root:[step 939999] Saving checkpoints to /home/ubuntu/ckpt-master/0939999.params, /home/ubuntu/ckpt-master/0939999.states. INFO:root:[step 940249] mlm_loss=1.51778 mlm_acc=67.92390 nsp_loss=0.01339 nsp_acc=99.551 throughput=130.0K tks/s lr=0.0000060 time=168.72 INFO:root:[step 940499] mlm_loss=1.60671 mlm_acc=65.64659 nsp_loss=0.02497 nsp_acc=99.139 throughput=147.0K tks/s lr=0.0000060 time=149.19 INFO:root:[step 940749] mlm_loss=1.42492 mlm_acc=68.39874 nsp_loss=0.01977 nsp_acc=99.336 throughput=135.0K tks/s lr=0.0000059 time=116.62 INFO:root:[step 940999] mlm_loss=1.70534 mlm_acc=64.38753 nsp_loss=0.04207 nsp_acc=98.391 throughput=147.0K tks/s lr=0.0000059 time=160.11 INFO:root:[step 941249] mlm_loss=1.46577 mlm_acc=66.09060 nsp_loss=0.02851 nsp_acc=98.969 throughput=142.0K tks/s lr=0.0000059 time=136.15 INFO:root:[step 941499] mlm_loss=1.52013 mlm_acc=66.08858 nsp_loss=0.02799 nsp_acc=98.989 throughput=138.0K tks/s lr=0.0000059 time=137.51 INFO:root:[step 941749] mlm_loss=1.41458 mlm_acc=67.95394 nsp_loss=0.02770 nsp_acc=99.002 throughput=127.0K tks/s lr=0.0000058 time=123.50 INFO:root:[step 941999] mlm_loss=1.50306 mlm_acc=66.90924 nsp_loss=0.02821 nsp_acc=98.985 throughput=138.0K tks/s lr=0.0000058 time=139.40 INFO:root:[step 942249] mlm_loss=1.27493 mlm_acc=69.69164 nsp_loss=0.02837 nsp_acc=99.002 throughput=114.0K tks/s lr=0.0000058 time=106.35 INFO:root:[step 942499] mlm_loss=1.32518 mlm_acc=69.46412 nsp_loss=0.02466 nsp_acc=99.156 throughput=123.0K tks/s lr=0.0000058 time=108.81 INFO:root:[step 942749] mlm_loss=1.27528 mlm_acc=71.78940 nsp_loss=0.02461 nsp_acc=99.157 throughput=133.0K tks/s lr=0.0000057 time=133.74 INFO:root:[step 942999] mlm_loss=1.69602 mlm_acc=63.96279 nsp_loss=0.04235 nsp_acc=98.394 throughput=129.0K tks/s lr=0.0000057 time=129.76 INFO:root:[step 943249] mlm_loss=1.42423 mlm_acc=68.50743 nsp_loss=0.01973 nsp_acc=99.324 throughput=134.0K tks/s lr=0.0000057 time=117.02 INFO:root:[step 943499] mlm_loss=1.60694 mlm_acc=65.59524 nsp_loss=0.01526 nsp_acc=99.479 throughput=150.0K tks/s lr=0.0000057 time=149.52 INFO:root:[step 943749] mlm_loss=1.44606 mlm_acc=67.37204 nsp_loss=0.01829 nsp_acc=99.368 throughput=133.0K tks/s lr=0.0000056 time=133.39 INFO:root:[step 943999] mlm_loss=1.50569 mlm_acc=65.85738 nsp_loss=0.03167 nsp_acc=98.822 throughput=132.0K tks/s lr=0.0000056 time=133.93 INFO:root:[step 944249] mlm_loss=1.31587 mlm_acc=69.44554 nsp_loss=0.02606 nsp_acc=99.075 throughput=120.0K tks/s lr=0.0000056 time=107.84 INFO:root:[step 944499] mlm_loss=1.32259 mlm_acc=69.34995 nsp_loss=0.02615 nsp_acc=99.089 throughput=113.0K tks/s lr=0.0000056 time=120.60 INFO:root:[step 944749] mlm_loss=1.33395 mlm_acc=69.54772 nsp_loss=0.02299 nsp_acc=99.212 throughput=120.0K tks/s lr=0.0000055 time=109.05 INFO:root:[step 944999] mlm_loss=1.39098 mlm_acc=68.94251 nsp_loss=0.02024 nsp_acc=99.300 throughput=130.0K tks/s lr=0.0000055 time=115.01 INFO:root:[step 944999] Saving checkpoints to /home/ubuntu/ckpt-master/0944999.params, /home/ubuntu/ckpt-master/0944999.states. INFO:root:[step 945249] mlm_loss=1.42046 mlm_acc=68.58283 nsp_loss=0.02091 nsp_acc=99.312 throughput=110.0K tks/s lr=0.0000055 time=136.52 INFO:root:[step 945499] mlm_loss=1.43040 mlm_acc=68.23534 nsp_loss=0.01911 nsp_acc=99.374 throughput=134.0K tks/s lr=0.0000055 time=119.41 INFO:root:[step 945749] mlm_loss=1.50922 mlm_acc=65.94403 nsp_loss=0.02759 nsp_acc=99.026 throughput=137.0K tks/s lr=0.0000054 time=135.21 INFO:root:[step 945999] mlm_loss=1.39761 mlm_acc=68.57390 nsp_loss=0.02121 nsp_acc=99.251 throughput=125.0K tks/s lr=0.0000054 time=122.77 INFO:root:[step 946249] mlm_loss=1.57171 mlm_acc=66.95769 nsp_loss=0.01314 nsp_acc=99.563 throughput=144.0K tks/s lr=0.0000054 time=138.78 INFO:root:[step 946499] mlm_loss=1.35779 mlm_acc=68.93271 nsp_loss=0.02323 nsp_acc=99.205 throughput=126.0K tks/s lr=0.0000054 time=117.03 INFO:root:[step 946749] mlm_loss=1.79252 mlm_acc=62.63881 nsp_loss=0.04996 nsp_acc=98.030 throughput=146.0K tks/s lr=0.0000053 time=146.21 INFO:root:[step 946999] mlm_loss=1.40544 mlm_acc=67.98648 nsp_loss=0.02839 nsp_acc=98.988 throughput=120.0K tks/s lr=0.0000053 time=125.16 INFO:root:[step 947249] mlm_loss=1.56063 mlm_acc=65.77792 nsp_loss=0.02776 nsp_acc=98.966 throughput=143.0K tks/s lr=0.0000053 time=145.08 INFO:root:[step 947499] mlm_loss=1.34098 mlm_acc=69.16287 nsp_loss=0.02676 nsp_acc=99.071 throughput=124.0K tks/s lr=0.0000053 time=109.81 INFO:root:[step 947749] mlm_loss=1.33966 mlm_acc=69.21755 nsp_loss=0.02854 nsp_acc=99.015 throughput=113.0K tks/s lr=0.0000052 time=118.17 INFO:root:[step 947999] mlm_loss=1.37614 mlm_acc=68.83557 nsp_loss=0.02363 nsp_acc=99.174 throughput=130.0K tks/s lr=0.0000052 time=113.22 INFO:root:[step 948249] mlm_loss=1.58599 mlm_acc=65.73312 nsp_loss=0.01408 nsp_acc=99.514 throughput=148.0K tks/s lr=0.0000052 time=143.88 INFO:root:[step 948499] mlm_loss=1.54683 mlm_acc=66.16312 nsp_loss=0.01667 nsp_acc=99.431 throughput=139.0K tks/s lr=0.0000052 time=140.50 INFO:root:[step 948749] mlm_loss=1.62516 mlm_acc=65.27750 nsp_loss=0.01744 nsp_acc=99.378 throughput=147.0K tks/s lr=0.0000051 time=146.35 INFO:root:[step 948999] mlm_loss=1.45116 mlm_acc=68.79360 nsp_loss=0.01920 nsp_acc=99.331 throughput=140.0K tks/s lr=0.0000051 time=135.10 INFO:root:[step 949249] mlm_loss=1.68202 mlm_acc=64.97397 nsp_loss=0.03106 nsp_acc=98.824 throughput=139.0K tks/s lr=0.0000051 time=138.50 INFO:root:[step 949499] mlm_loss=1.37992 mlm_acc=68.36494 nsp_loss=0.02701 nsp_acc=99.060 throughput=120.0K tks/s lr=0.0000051 time=116.92 INFO:root:[step 949749] mlm_loss=1.40048 mlm_acc=66.84750 nsp_loss=0.03473 nsp_acc=98.791 throughput=139.0K tks/s lr=0.0000050 time=128.35 INFO:root:[step 949999] mlm_loss=1.56150 mlm_acc=65.86366 nsp_loss=0.01877 nsp_acc=99.352 throughput=150.0K tks/s lr=0.0000050 time=147.75 INFO:root:[step 949999] Saving checkpoints to /home/ubuntu/ckpt-master/0949999.params, /home/ubuntu/ckpt-master/0949999.states. INFO:root:[step 950249] mlm_loss=1.58309 mlm_acc=66.76706 nsp_loss=0.02025 nsp_acc=99.238 throughput=130.0K tks/s lr=0.0000050 time=169.02 INFO:root:[step 950499] mlm_loss=1.55481 mlm_acc=66.89023 nsp_loss=0.04892 nsp_acc=97.935 throughput=136.0K tks/s lr=0.0000050 time=139.74 INFO:root:[step 950749] mlm_loss=1.43722 mlm_acc=66.83698 nsp_loss=0.02911 nsp_acc=98.955 throughput=145.0K tks/s lr=0.0000049 time=124.78 INFO:root:[step 950999] mlm_loss=1.26884 mlm_acc=69.13013 nsp_loss=0.03108 nsp_acc=98.923 throughput=111.0K tks/s lr=0.0000049 time=120.89 INFO:root:[step 951249] mlm_loss=1.33795 mlm_acc=69.62575 nsp_loss=0.02441 nsp_acc=99.166 throughput=123.0K tks/s lr=0.0000049 time=106.72 INFO:root:[step 951499] mlm_loss=1.40151 mlm_acc=68.84486 nsp_loss=0.02103 nsp_acc=99.268 throughput=133.0K tks/s lr=0.0000049 time=116.35 INFO:root:[step 951749] mlm_loss=1.32032 mlm_acc=69.32019 nsp_loss=0.02594 nsp_acc=99.080 throughput=114.0K tks/s lr=0.0000048 time=119.46 INFO:root:[step 951999] mlm_loss=1.48207 mlm_acc=67.47721 nsp_loss=0.01714 nsp_acc=99.427 throughput=132.0K tks/s lr=0.0000048 time=129.38 INFO:root:[step 952249] mlm_loss=1.37322 mlm_acc=68.91029 nsp_loss=0.02372 nsp_acc=99.197 throughput=128.0K tks/s lr=0.0000048 time=114.83 INFO:root:[step 952499] mlm_loss=1.46720 mlm_acc=67.75029 nsp_loss=0.01773 nsp_acc=99.430 throughput=132.0K tks/s lr=0.0000048 time=128.35 INFO:root:[step 952749] mlm_loss=1.51503 mlm_acc=65.77025 nsp_loss=0.02516 nsp_acc=99.065 throughput=141.0K tks/s lr=0.0000047 time=137.25 INFO:root:[step 952999] mlm_loss=1.23319 mlm_acc=73.37491 nsp_loss=0.02459 nsp_acc=99.212 throughput=147.0K tks/s lr=0.0000047 time=147.64 INFO:root:[step 953249] mlm_loss=1.56166 mlm_acc=66.42244 nsp_loss=0.05371 nsp_acc=97.787 throughput=140.0K tks/s lr=0.0000047 time=139.66 INFO:root:[step 953499] mlm_loss=1.48725 mlm_acc=67.64265 nsp_loss=0.01708 nsp_acc=99.417 throughput=143.0K tks/s lr=0.0000047 time=123.11 INFO:root:[step 953749] mlm_loss=1.41374 mlm_acc=67.24804 nsp_loss=0.02464 nsp_acc=99.116 throughput=128.0K tks/s lr=0.0000046 time=125.80 INFO:root:[step 953999] mlm_loss=1.42844 mlm_acc=67.14859 nsp_loss=0.02330 nsp_acc=99.168 throughput=133.0K tks/s lr=0.0000046 time=133.42 INFO:root:[step 954249] mlm_loss=1.52458 mlm_acc=67.80722 nsp_loss=0.01385 nsp_acc=99.551 throughput=143.0K tks/s lr=0.0000046 time=139.69 INFO:root:[step 954499] mlm_loss=1.18784 mlm_acc=73.71475 nsp_loss=0.02629 nsp_acc=99.160 throughput=141.0K tks/s lr=0.0000046 time=128.90 INFO:root:[step 954749] mlm_loss=1.39863 mlm_acc=67.78934 nsp_loss=0.02532 nsp_acc=99.105 throughput=125.0K tks/s lr=0.0000045 time=121.14 INFO:root:[step 954999] mlm_loss=1.59037 mlm_acc=65.79412 nsp_loss=0.01804 nsp_acc=99.388 throughput=145.0K tks/s lr=0.0000045 time=144.29 INFO:root:[step 954999] Saving checkpoints to /home/ubuntu/ckpt-master/0954999.params, /home/ubuntu/ckpt-master/0954999.states. INFO:root:[step 955249] mlm_loss=1.47102 mlm_acc=66.45888 nsp_loss=0.03815 nsp_acc=98.538 throughput=126.0K tks/s lr=0.0000045 time=161.50 INFO:root:[step 955499] mlm_loss=1.46421 mlm_acc=65.53254 nsp_loss=0.05307 nsp_acc=97.928 throughput=137.0K tks/s lr=0.0000045 time=117.28 INFO:root:[step 955749] mlm_loss=1.42527 mlm_acc=68.15736 nsp_loss=0.01989 nsp_acc=99.308 throughput=128.0K tks/s lr=0.0000044 time=129.44 INFO:root:[step 955999] mlm_loss=1.15291 mlm_acc=70.97249 nsp_loss=0.03694 nsp_acc=98.683 throughput=106.0K tks/s lr=0.0000044 time=105.04 INFO:root:[step 956249] mlm_loss=1.39680 mlm_acc=66.90422 nsp_loss=0.02927 nsp_acc=98.962 throughput=139.0K tks/s lr=0.0000044 time=139.61 INFO:root:[step 956499] mlm_loss=1.55034 mlm_acc=66.01464 nsp_loss=0.01657 nsp_acc=99.437 throughput=145.0K tks/s lr=0.0000044 time=141.95 INFO:root:[step 956749] mlm_loss=1.70678 mlm_acc=63.74785 nsp_loss=0.04132 nsp_acc=98.411 throughput=156.0K tks/s lr=0.0000043 time=173.48 INFO:root:[step 956999] mlm_loss=1.63890 mlm_acc=65.33277 nsp_loss=0.02987 nsp_acc=98.825 throughput=153.0K tks/s lr=0.0000043 time=154.87 INFO:root:[step 957249] mlm_loss=1.45132 mlm_acc=67.23074 nsp_loss=0.02493 nsp_acc=99.089 throughput=131.0K tks/s lr=0.0000043 time=127.56 INFO:root:[step 957499] mlm_loss=1.36293 mlm_acc=68.26003 nsp_loss=0.02340 nsp_acc=99.202 throughput=133.0K tks/s lr=0.0000043 time=121.67 INFO:root:[step 957749] mlm_loss=1.42644 mlm_acc=67.82411 nsp_loss=0.02441 nsp_acc=99.179 throughput=137.0K tks/s lr=0.0000042 time=132.41 INFO:root:[step 957999] mlm_loss=1.51643 mlm_acc=67.08015 nsp_loss=0.01928 nsp_acc=99.311 throughput=144.0K tks/s lr=0.0000042 time=143.23 INFO:root:[step 958249] mlm_loss=1.45250 mlm_acc=67.01507 nsp_loss=0.02772 nsp_acc=98.974 throughput=140.0K tks/s lr=0.0000042 time=144.33 INFO:root:[step 958499] mlm_loss=1.32314 mlm_acc=69.48350 nsp_loss=0.03545 nsp_acc=98.688 throughput=118.0K tks/s lr=0.0000042 time=107.66 INFO:root:[step 958749] mlm_loss=1.29162 mlm_acc=69.52254 nsp_loss=0.03155 nsp_acc=98.868 throughput=112.0K tks/s lr=0.0000041 time=116.86 INFO:root:[step 958999] mlm_loss=1.39834 mlm_acc=67.19355 nsp_loss=0.02495 nsp_acc=99.133 throughput=142.0K tks/s lr=0.0000041 time=124.33 INFO:root:[step 959249] mlm_loss=1.46898 mlm_acc=67.38111 nsp_loss=0.01913 nsp_acc=99.343 throughput=135.0K tks/s lr=0.0000041 time=134.52 INFO:root:[step 959499] mlm_loss=1.38880 mlm_acc=68.58208 nsp_loss=0.02498 nsp_acc=99.167 throughput=124.0K tks/s lr=0.0000041 time=126.46 INFO:root:[step 959749] mlm_loss=1.41990 mlm_acc=65.69819 nsp_loss=0.03531 nsp_acc=98.761 throughput=136.0K tks/s lr=0.0000040 time=134.15 INFO:root:[step 959999] mlm_loss=1.53422 mlm_acc=66.73232 nsp_loss=0.02614 nsp_acc=99.042 throughput=157.0K tks/s lr=0.0000040 time=156.95 INFO:root:[step 959999] Saving checkpoints to /home/ubuntu/ckpt-master/0959999.params, /home/ubuntu/ckpt-master/0959999.states. INFO:root:[step 960249] mlm_loss=1.52570 mlm_acc=66.95772 nsp_loss=0.02397 nsp_acc=99.163 throughput=129.0K tks/s lr=0.0000040 time=159.47 INFO:root:[step 960499] mlm_loss=1.24429 mlm_acc=70.55238 nsp_loss=0.03133 nsp_acc=98.919 throughput=120.0K tks/s lr=0.0000040 time=107.65 INFO:root:[step 960749] mlm_loss=1.32769 mlm_acc=69.57325 nsp_loss=0.02383 nsp_acc=99.209 throughput=121.0K tks/s lr=0.0000039 time=117.90 INFO:root:[step 960999] mlm_loss=1.64766 mlm_acc=66.25714 nsp_loss=0.02568 nsp_acc=99.033 throughput=143.0K tks/s lr=0.0000039 time=149.82 INFO:root:[step 961249] mlm_loss=1.83715 mlm_acc=62.71073 nsp_loss=0.03372 nsp_acc=98.739 throughput=151.0K tks/s lr=0.0000039 time=151.38 INFO:root:[step 961499] mlm_loss=1.52915 mlm_acc=66.73788 nsp_loss=0.01978 nsp_acc=99.327 throughput=141.0K tks/s lr=0.0000039 time=139.12 INFO:root:[step 961749] mlm_loss=1.42847 mlm_acc=67.00133 nsp_loss=0.02823 nsp_acc=98.959 throughput=131.0K tks/s lr=0.0000038 time=129.44 INFO:root:[step 961999] mlm_loss=1.47169 mlm_acc=66.99139 nsp_loss=0.02821 nsp_acc=98.965 throughput=143.0K tks/s lr=0.0000038 time=129.70 INFO:root:[step 962249] mlm_loss=1.31865 mlm_acc=69.58872 nsp_loss=0.02447 nsp_acc=99.158 throughput=111.0K tks/s lr=0.0000038 time=118.61 INFO:root:[step 962499] mlm_loss=1.28316 mlm_acc=69.85811 nsp_loss=0.02783 nsp_acc=99.029 throughput=120.0K tks/s lr=0.0000038 time=106.42 INFO:root:[step 962749] mlm_loss=1.26411 mlm_acc=69.74006 nsp_loss=0.02760 nsp_acc=99.061 throughput=119.0K tks/s lr=0.0000037 time=107.08 INFO:root:[step 962999] mlm_loss=1.36622 mlm_acc=68.83512 nsp_loss=0.02266 nsp_acc=99.215 throughput=120.0K tks/s lr=0.0000037 time=119.76 INFO:root:[step 963249] mlm_loss=1.36880 mlm_acc=68.91633 nsp_loss=0.02437 nsp_acc=99.150 throughput=129.0K tks/s lr=0.0000037 time=112.69 INFO:root:[step 963499] mlm_loss=1.50304 mlm_acc=67.65549 nsp_loss=0.01775 nsp_acc=99.374 throughput=133.0K tks/s lr=0.0000037 time=131.93 INFO:root:[step 963749] mlm_loss=1.48498 mlm_acc=67.98346 nsp_loss=0.01603 nsp_acc=99.451 throughput=132.0K tks/s lr=0.0000036 time=131.35 INFO:root:[step 963999] mlm_loss=1.35614 mlm_acc=67.79279 nsp_loss=0.02739 nsp_acc=99.027 throughput=146.0K tks/s lr=0.0000036 time=127.00 INFO:root:[step 964249] mlm_loss=1.52699 mlm_acc=67.39267 nsp_loss=0.01359 nsp_acc=99.554 throughput=141.0K tks/s lr=0.0000036 time=137.19 INFO:root:[step 964499] mlm_loss=1.39997 mlm_acc=69.00204 nsp_loss=0.02327 nsp_acc=99.167 throughput=122.0K tks/s lr=0.0000036 time=123.42 INFO:root:[step 964749] mlm_loss=1.42530 mlm_acc=68.67412 nsp_loss=0.01968 nsp_acc=99.307 throughput=123.0K tks/s lr=0.0000035 time=127.40 INFO:root:[step 964999] mlm_loss=1.39387 mlm_acc=68.44521 nsp_loss=0.02036 nsp_acc=99.304 throughput=136.0K tks/s lr=0.0000035 time=116.43 INFO:root:[step 964999] Saving checkpoints to /home/ubuntu/ckpt-master/0964999.params, /home/ubuntu/ckpt-master/0964999.states. INFO:root:[step 965249] mlm_loss=1.56901 mlm_acc=66.23951 nsp_loss=0.02294 nsp_acc=99.173 throughput=130.0K tks/s lr=0.0000035 time=155.37 INFO:root:[step 965499] mlm_loss=1.58792 mlm_acc=66.44115 nsp_loss=0.01785 nsp_acc=99.366 throughput=146.0K tks/s lr=0.0000035 time=143.22 INFO:root:[step 965749] mlm_loss=1.56073 mlm_acc=65.78851 nsp_loss=0.05724 nsp_acc=97.614 throughput=143.0K tks/s lr=0.0000034 time=148.97 INFO:root:[step 965999] mlm_loss=1.55168 mlm_acc=66.31303 nsp_loss=0.05478 nsp_acc=97.640 throughput=140.0K tks/s lr=0.0000034 time=142.08 INFO:root:[step 966249] mlm_loss=1.25910 mlm_acc=69.83039 nsp_loss=0.03133 nsp_acc=98.897 throughput=110.0K tks/s lr=0.0000034 time=118.41 INFO:root:[step 966499] mlm_loss=1.40832 mlm_acc=68.49988 nsp_loss=0.02318 nsp_acc=99.182 throughput=130.0K tks/s lr=0.0000034 time=111.87 INFO:root:[step 966749] mlm_loss=1.44422 mlm_acc=68.19617 nsp_loss=0.02097 nsp_acc=99.271 throughput=125.0K tks/s lr=0.0000033 time=123.43 INFO:root:[step 966999] mlm_loss=1.29016 mlm_acc=69.63392 nsp_loss=0.02655 nsp_acc=99.063 throughput=118.0K tks/s lr=0.0000033 time=106.86 INFO:root:[step 967249] mlm_loss=1.48696 mlm_acc=68.02156 nsp_loss=0.01754 nsp_acc=99.420 throughput=139.0K tks/s lr=0.0000033 time=121.71 INFO:root:[step 967499] mlm_loss=1.29123 mlm_acc=69.75039 nsp_loss=0.02741 nsp_acc=99.051 throughput=107.0K tks/s lr=0.0000033 time=116.96 INFO:root:[step 967749] mlm_loss=1.30713 mlm_acc=69.60299 nsp_loss=0.02794 nsp_acc=99.076 throughput=120.0K tks/s lr=0.0000032 time=113.24 INFO:root:[step 967999] mlm_loss=1.50680 mlm_acc=66.61099 nsp_loss=0.02799 nsp_acc=98.959 throughput=137.0K tks/s lr=0.0000032 time=130.90 INFO:root:[step 968249] mlm_loss=1.46217 mlm_acc=66.74587 nsp_loss=0.03257 nsp_acc=98.772 throughput=124.0K tks/s lr=0.0000032 time=128.73 INFO:root:[step 968499] mlm_loss=1.38610 mlm_acc=68.45999 nsp_loss=0.02291 nsp_acc=99.190 throughput=134.0K tks/s lr=0.0000032 time=115.21 INFO:root:[step 968749] mlm_loss=1.56733 mlm_acc=66.37696 nsp_loss=0.01798 nsp_acc=99.338 throughput=145.0K tks/s lr=0.0000031 time=141.92 INFO:root:[step 968999] mlm_loss=1.47211 mlm_acc=67.37669 nsp_loss=0.02255 nsp_acc=99.188 throughput=131.0K tks/s lr=0.0000031 time=129.13 INFO:root:[step 969249] mlm_loss=1.35567 mlm_acc=68.87024 nsp_loss=0.02139 nsp_acc=99.282 throughput=131.0K tks/s lr=0.0000031 time=116.27 INFO:root:[step 969499] mlm_loss=1.29208 mlm_acc=69.76413 nsp_loss=0.02626 nsp_acc=99.087 throughput=112.0K tks/s lr=0.0000031 time=114.27 INFO:root:[step 969749] mlm_loss=1.41538 mlm_acc=68.53143 nsp_loss=0.01983 nsp_acc=99.335 throughput=131.0K tks/s lr=0.0000030 time=117.62 INFO:root:[step 969999] mlm_loss=1.44800 mlm_acc=67.48565 nsp_loss=0.01838 nsp_acc=99.389 throughput=133.0K tks/s lr=0.0000030 time=130.82 INFO:root:[step 969999] Saving checkpoints to /home/ubuntu/ckpt-master/0969999.params, /home/ubuntu/ckpt-master/0969999.states. INFO:root:[step 970249] mlm_loss=1.42020 mlm_acc=68.54597 nsp_loss=0.02023 nsp_acc=99.296 throughput=110.0K tks/s lr=0.0000030 time=140.30 INFO:root:[step 970499] mlm_loss=1.11804 mlm_acc=70.68365 nsp_loss=0.04018 nsp_acc=98.587 throughput=109.0K tks/s lr=0.0000030 time=103.16 INFO:root:[step 970749] mlm_loss=1.43790 mlm_acc=67.05551 nsp_loss=0.02580 nsp_acc=99.060 throughput=141.0K tks/s lr=0.0000029 time=132.12 INFO:root:[step 970999] mlm_loss=1.39839 mlm_acc=66.80112 nsp_loss=0.02353 nsp_acc=99.192 throughput=125.0K tks/s lr=0.0000029 time=126.55 INFO:root:[step 971249] mlm_loss=1.53658 mlm_acc=65.49384 nsp_loss=0.02531 nsp_acc=99.131 throughput=137.0K tks/s lr=0.0000029 time=135.13 INFO:root:[step 971499] mlm_loss=1.44683 mlm_acc=66.84780 nsp_loss=0.02866 nsp_acc=99.020 throughput=135.0K tks/s lr=0.0000029 time=119.75 INFO:root:[step 971749] mlm_loss=1.45100 mlm_acc=67.09535 nsp_loss=0.02836 nsp_acc=99.025 throughput=140.0K tks/s lr=0.0000028 time=140.25 INFO:root:[step 971999] mlm_loss=1.53641 mlm_acc=67.43676 nsp_loss=0.01383 nsp_acc=99.525 throughput=140.0K tks/s lr=0.0000028 time=134.34 INFO:root:[step 972249] mlm_loss=1.27114 mlm_acc=69.46421 nsp_loss=0.02962 nsp_acc=98.941 throughput=115.0K tks/s lr=0.0000028 time=117.33 INFO:root:[step 972499] mlm_loss=1.51584 mlm_acc=67.47516 nsp_loss=0.01490 nsp_acc=99.508 throughput=140.0K tks/s lr=0.0000028 time=133.48 INFO:root:[step 972749] mlm_loss=1.46028 mlm_acc=67.51705 nsp_loss=0.01618 nsp_acc=99.446 throughput=140.0K tks/s lr=0.0000027 time=127.51 INFO:root:[step 972999] mlm_loss=1.53836 mlm_acc=67.22152 nsp_loss=0.01570 nsp_acc=99.462 throughput=140.0K tks/s lr=0.0000027 time=135.60 INFO:root:[step 973249] mlm_loss=1.50641 mlm_acc=66.34690 nsp_loss=0.02831 nsp_acc=98.934 throughput=141.0K tks/s lr=0.0000027 time=141.38 INFO:root:[step 973499] mlm_loss=1.43013 mlm_acc=67.96989 nsp_loss=0.02367 nsp_acc=99.160 throughput=126.0K tks/s lr=0.0000027 time=128.06 INFO:root:[step 973749] mlm_loss=1.37674 mlm_acc=67.64221 nsp_loss=0.02822 nsp_acc=98.953 throughput=134.0K tks/s lr=0.0000026 time=135.40 INFO:root:[step 973999] mlm_loss=1.56168 mlm_acc=65.56636 nsp_loss=0.03800 nsp_acc=98.553 throughput=129.0K tks/s lr=0.0000026 time=133.26 INFO:root:[step 974249] mlm_loss=1.36007 mlm_acc=67.83174 nsp_loss=0.02851 nsp_acc=98.992 throughput=139.0K tks/s lr=0.0000026 time=118.09 INFO:root:[step 974499] mlm_loss=1.59159 mlm_acc=65.48615 nsp_loss=0.02194 nsp_acc=99.193 throughput=146.0K tks/s lr=0.0000026 time=144.42 INFO:root:[step 974749] mlm_loss=1.35162 mlm_acc=67.94094 nsp_loss=0.02660 nsp_acc=99.024 throughput=118.0K tks/s lr=0.0000025 time=124.30 INFO:root:[step 974999] mlm_loss=1.25294 mlm_acc=69.90413 nsp_loss=0.03015 nsp_acc=98.947 throughput=121.0K tks/s lr=0.0000025 time=110.59 INFO:root:[step 974999] Saving checkpoints to /home/ubuntu/ckpt-master/0974999.params, /home/ubuntu/ckpt-master/0974999.states. INFO:root:[step 975249] mlm_loss=1.36908 mlm_acc=68.23347 nsp_loss=0.02641 nsp_acc=99.067 throughput=111.0K tks/s lr=0.0000025 time=140.90 INFO:root:[step 975499] mlm_loss=1.30807 mlm_acc=69.57254 nsp_loss=0.02835 nsp_acc=99.013 throughput=120.0K tks/s lr=0.0000025 time=110.37 INFO:root:[step 975749] mlm_loss=1.26512 mlm_acc=69.95506 nsp_loss=0.02966 nsp_acc=98.971 throughput=117.0K tks/s lr=0.0000024 time=107.24 INFO:root:[step 975999] mlm_loss=1.57416 mlm_acc=64.93887 nsp_loss=0.02791 nsp_acc=98.981 throughput=144.0K tks/s lr=0.0000024 time=141.23 INFO:root:[step 976249] mlm_loss=1.44594 mlm_acc=68.16216 nsp_loss=0.01954 nsp_acc=99.335 throughput=128.0K tks/s lr=0.0000024 time=128.64 INFO:root:[step 976499] mlm_loss=1.35462 mlm_acc=69.34203 nsp_loss=0.02267 nsp_acc=99.209 throughput=132.0K tks/s lr=0.0000024 time=112.33 INFO:root:[step 976749] mlm_loss=1.40081 mlm_acc=68.66089 nsp_loss=0.02344 nsp_acc=99.192 throughput=118.0K tks/s lr=0.0000023 time=123.23 INFO:root:[step 976999] mlm_loss=1.56171 mlm_acc=65.20449 nsp_loss=0.03661 nsp_acc=98.631 throughput=134.0K tks/s lr=0.0000023 time=134.58 INFO:root:[step 977249] mlm_loss=1.37898 mlm_acc=68.84744 nsp_loss=0.02087 nsp_acc=99.297 throughput=133.0K tks/s lr=0.0000023 time=115.12 INFO:root:[step 977499] mlm_loss=1.59344 mlm_acc=65.61834 nsp_loss=0.02417 nsp_acc=99.046 throughput=149.0K tks/s lr=0.0000023 time=148.48 INFO:root:[step 977749] mlm_loss=1.43821 mlm_acc=68.35827 nsp_loss=0.02030 nsp_acc=99.307 throughput=122.0K tks/s lr=0.0000022 time=125.22 INFO:root:[step 977999] mlm_loss=1.31654 mlm_acc=69.67483 nsp_loss=0.02633 nsp_acc=99.064 throughput=119.0K tks/s lr=0.0000022 time=106.03 INFO:root:[step 978249] mlm_loss=1.58322 mlm_acc=65.27603 nsp_loss=0.06633 nsp_acc=97.316 throughput=148.0K tks/s lr=0.0000022 time=144.59 INFO:root:[step 978499] mlm_loss=1.41356 mlm_acc=67.41999 nsp_loss=0.03330 nsp_acc=98.763 throughput=128.0K tks/s lr=0.0000022 time=127.03 INFO:root:[step 978749] mlm_loss=1.50198 mlm_acc=66.90627 nsp_loss=0.02370 nsp_acc=99.116 throughput=143.0K tks/s lr=0.0000021 time=145.78 INFO:root:[step 978999] mlm_loss=1.48392 mlm_acc=67.27225 nsp_loss=0.02401 nsp_acc=99.132 throughput=145.0K tks/s lr=0.0000021 time=139.20 INFO:root:[step 979249] mlm_loss=1.34801 mlm_acc=68.40884 nsp_loss=0.03198 nsp_acc=98.866 throughput=131.0K tks/s lr=0.0000021 time=131.28 INFO:root:[step 979499] mlm_loss=1.45600 mlm_acc=66.43512 nsp_loss=0.03425 nsp_acc=98.744 throughput=141.0K tks/s lr=0.0000021 time=134.02 INFO:root:[step 979749] mlm_loss=1.55071 mlm_acc=65.40490 nsp_loss=0.01887 nsp_acc=99.346 throughput=143.0K tks/s lr=0.0000020 time=142.94 INFO:root:[step 979999] mlm_loss=1.38257 mlm_acc=68.05041 nsp_loss=0.03513 nsp_acc=98.696 throughput=123.0K tks/s lr=0.0000020 time=124.13 INFO:root:[step 979999] Saving checkpoints to /home/ubuntu/ckpt-master/0979999.params, /home/ubuntu/ckpt-master/0979999.states. INFO:root:[step 980249] mlm_loss=1.38059 mlm_acc=67.82462 nsp_loss=0.04405 nsp_acc=98.249 throughput=120.0K tks/s lr=0.0000020 time=133.69 INFO:root:[step 980499] mlm_loss=1.47553 mlm_acc=67.93669 nsp_loss=0.01785 nsp_acc=99.377 throughput=130.0K tks/s lr=0.0000020 time=130.82 INFO:root:[step 980749] mlm_loss=1.61982 mlm_acc=65.06777 nsp_loss=0.03686 nsp_acc=98.588 throughput=153.0K tks/s lr=0.0000019 time=152.30 INFO:root:[step 980999] mlm_loss=1.54373 mlm_acc=65.38605 nsp_loss=0.03809 nsp_acc=98.592 throughput=133.0K tks/s lr=0.0000019 time=136.23 INFO:root:[step 981249] mlm_loss=1.30213 mlm_acc=69.86177 nsp_loss=0.02599 nsp_acc=99.120 throughput=116.0K tks/s lr=0.0000019 time=108.00 INFO:root:[step 981499] mlm_loss=1.58199 mlm_acc=65.67098 nsp_loss=0.01620 nsp_acc=99.449 throughput=141.0K tks/s lr=0.0000019 time=158.60 INFO:root:[step 981749] mlm_loss=1.47086 mlm_acc=65.90145 nsp_loss=0.02232 nsp_acc=99.207 throughput=142.0K tks/s lr=0.0000018 time=124.47 INFO:root:[step 981999] mlm_loss=1.42651 mlm_acc=67.90007 nsp_loss=0.01928 nsp_acc=99.360 throughput=131.0K tks/s lr=0.0000018 time=129.25 INFO:root:[step 982249] mlm_loss=1.47432 mlm_acc=67.76901 nsp_loss=0.02002 nsp_acc=99.296 throughput=129.0K tks/s lr=0.0000018 time=132.29 INFO:root:[step 982499] mlm_loss=1.33127 mlm_acc=69.13683 nsp_loss=0.02620 nsp_acc=99.095 throughput=125.0K tks/s lr=0.0000018 time=109.42 INFO:root:[step 982749] mlm_loss=1.50620 mlm_acc=66.86269 nsp_loss=0.02155 nsp_acc=99.253 throughput=147.0K tks/s lr=0.0000017 time=142.85 INFO:root:[step 982999] mlm_loss=1.35701 mlm_acc=71.03074 nsp_loss=0.02273 nsp_acc=99.206 throughput=137.0K tks/s lr=0.0000017 time=134.65 INFO:root:[step 983249] mlm_loss=1.48205 mlm_acc=68.27065 nsp_loss=0.03071 nsp_acc=98.920 throughput=148.0K tks/s lr=0.0000017 time=149.99 INFO:root:[step 983499] mlm_loss=1.48511 mlm_acc=67.32488 nsp_loss=0.03895 nsp_acc=98.400 throughput=142.0K tks/s lr=0.0000017 time=141.35 INFO:root:[step 983749] mlm_loss=1.50434 mlm_acc=67.24781 nsp_loss=0.01924 nsp_acc=99.324 throughput=140.0K tks/s lr=0.0000016 time=135.49 INFO:root:[step 983999] mlm_loss=1.12353 mlm_acc=73.98446 nsp_loss=0.02999 nsp_acc=99.025 throughput=144.0K tks/s lr=0.0000016 time=150.01 INFO:root:[step 984249] mlm_loss=1.52386 mlm_acc=66.67431 nsp_loss=0.06946 nsp_acc=97.084 throughput=138.0K tks/s lr=0.0000016 time=124.87 INFO:root:[step 984499] mlm_loss=1.53833 mlm_acc=67.09944 nsp_loss=0.01578 nsp_acc=99.427 throughput=138.0K tks/s lr=0.0000016 time=148.87 INFO:root:[step 984749] mlm_loss=1.29067 mlm_acc=69.65319 nsp_loss=0.02434 nsp_acc=99.190 throughput=123.0K tks/s lr=0.0000015 time=109.82 INFO:root:[step 984999] mlm_loss=1.35689 mlm_acc=69.29753 nsp_loss=0.02181 nsp_acc=99.276 throughput=133.0K tks/s lr=0.0000015 time=115.11 INFO:root:[step 984999] Saving checkpoints to /home/ubuntu/ckpt-master/0984999.params, /home/ubuntu/ckpt-master/0984999.states. INFO:root:[step 985249] mlm_loss=1.16404 mlm_acc=70.63366 nsp_loss=0.04206 nsp_acc=98.502 throughput=95.0K tks/s lr=0.0000015 time=132.54 INFO:root:[step 985499] mlm_loss=1.32045 mlm_acc=69.45615 nsp_loss=0.02650 nsp_acc=99.103 throughput=122.0K tks/s lr=0.0000015 time=111.56 INFO:root:[step 985749] mlm_loss=1.50964 mlm_acc=66.00401 nsp_loss=0.02836 nsp_acc=98.958 throughput=154.0K tks/s lr=0.0000014 time=154.38 INFO:root:[step 985999] mlm_loss=1.47186 mlm_acc=67.50102 nsp_loss=0.01786 nsp_acc=99.385 throughput=135.0K tks/s lr=0.0000014 time=134.65 INFO:root:[step 986249] mlm_loss=1.55271 mlm_acc=66.25172 nsp_loss=0.05770 nsp_acc=97.742 throughput=152.0K tks/s lr=0.0000014 time=153.30 INFO:root:[step 986499] mlm_loss=1.37344 mlm_acc=68.77615 nsp_loss=0.02839 nsp_acc=98.971 throughput=118.0K tks/s lr=0.0000014 time=121.36 INFO:root:[step 986749] mlm_loss=1.49635 mlm_acc=66.97471 nsp_loss=0.04890 nsp_acc=98.042 throughput=141.0K tks/s lr=0.0000013 time=143.50 INFO:root:[step 986999] mlm_loss=1.45627 mlm_acc=68.28986 nsp_loss=0.02066 nsp_acc=99.313 throughput=136.0K tks/s lr=0.0000013 time=118.28 INFO:root:[step 987249] mlm_loss=1.33982 mlm_acc=69.27030 nsp_loss=0.02462 nsp_acc=99.136 throughput=116.0K tks/s lr=0.0000013 time=120.22 INFO:root:[step 987499] mlm_loss=1.49992 mlm_acc=66.12452 nsp_loss=0.04370 nsp_acc=98.379 throughput=125.0K tks/s lr=0.0000013 time=112.97 INFO:root:[step 987749] mlm_loss=1.66938 mlm_acc=65.10115 nsp_loss=0.03489 nsp_acc=98.590 throughput=150.0K tks/s lr=0.0000012 time=150.38 INFO:root:[step 987999] mlm_loss=1.35158 mlm_acc=68.58562 nsp_loss=0.02713 nsp_acc=99.049 throughput=122.0K tks/s lr=0.0000012 time=122.80 INFO:root:[step 988249] mlm_loss=1.45393 mlm_acc=68.29224 nsp_loss=0.01783 nsp_acc=99.404 throughput=137.0K tks/s lr=0.0000012 time=119.58 INFO:root:[step 988499] mlm_loss=1.52875 mlm_acc=66.34628 nsp_loss=0.04378 nsp_acc=98.291 throughput=136.0K tks/s lr=0.0000012 time=138.45 INFO:root:[step 988749] mlm_loss=1.43751 mlm_acc=68.10694 nsp_loss=0.02140 nsp_acc=99.212 throughput=127.0K tks/s lr=0.0000011 time=127.32 INFO:root:[step 988999] mlm_loss=1.47411 mlm_acc=66.19986 nsp_loss=0.05072 nsp_acc=98.002 throughput=135.0K tks/s lr=0.0000011 time=130.94 INFO:root:[step 989249] mlm_loss=1.51373 mlm_acc=67.17327 nsp_loss=0.03756 nsp_acc=98.554 throughput=149.0K tks/s lr=0.0000011 time=147.28 INFO:root:[step 989499] mlm_loss=1.54913 mlm_acc=66.75342 nsp_loss=0.04063 nsp_acc=98.350 throughput=143.0K tks/s lr=0.0000011 time=143.50 INFO:root:[step 989749] mlm_loss=1.41824 mlm_acc=67.44232 nsp_loss=0.05697 nsp_acc=97.734 throughput=135.0K tks/s lr=0.0000010 time=127.81 INFO:root:[step 989999] mlm_loss=1.29639 mlm_acc=69.79397 nsp_loss=0.02683 nsp_acc=99.056 throughput=118.0K tks/s lr=0.0000010 time=107.29 INFO:root:[step 989999] Saving checkpoints to /home/ubuntu/ckpt-master/0989999.params, /home/ubuntu/ckpt-master/0989999.states. INFO:root:[step 990249] mlm_loss=1.52819 mlm_acc=67.49112 nsp_loss=0.01427 nsp_acc=99.505 throughput=125.0K tks/s lr=0.0000010 time=149.63 INFO:root:[step 990499] mlm_loss=1.32129 mlm_acc=69.51885 nsp_loss=0.02377 nsp_acc=99.188 throughput=120.0K tks/s lr=0.0000010 time=119.95 INFO:root:[step 990749] mlm_loss=1.38559 mlm_acc=68.85526 nsp_loss=0.02327 nsp_acc=99.197 throughput=131.0K tks/s lr=0.0000009 time=114.33 INFO:root:[step 990999] mlm_loss=1.29003 mlm_acc=69.87850 nsp_loss=0.02827 nsp_acc=99.022 throughput=111.0K tks/s lr=0.0000009 time=117.63 INFO:root:[step 991249] mlm_loss=1.36867 mlm_acc=68.96705 nsp_loss=0.02174 nsp_acc=99.265 throughput=131.0K tks/s lr=0.0000009 time=116.98 INFO:root:[step 991499] mlm_loss=1.55425 mlm_acc=65.73864 nsp_loss=0.02488 nsp_acc=99.084 throughput=139.0K tks/s lr=0.0000009 time=141.67 INFO:root:[step 991749] mlm_loss=1.36209 mlm_acc=69.44888 nsp_loss=0.02462 nsp_acc=99.171 throughput=129.0K tks/s lr=0.0000008 time=110.92 INFO:root:[step 991999] mlm_loss=1.47472 mlm_acc=68.11917 nsp_loss=0.01707 nsp_acc=99.435 throughput=130.0K tks/s lr=0.0000008 time=127.25 INFO:root:[step 992249] mlm_loss=1.29620 mlm_acc=69.08030 nsp_loss=0.03949 nsp_acc=98.535 throughput=119.0K tks/s lr=0.0000008 time=110.67 INFO:root:[step 992499] mlm_loss=1.40548 mlm_acc=68.35761 nsp_loss=0.02298 nsp_acc=99.223 throughput=124.0K tks/s lr=0.0000008 time=125.59 INFO:root:[step 992749] mlm_loss=1.30871 mlm_acc=69.37726 nsp_loss=0.02919 nsp_acc=98.949 throughput=121.0K tks/s lr=0.0000007 time=108.98 INFO:root:[step 992999] mlm_loss=1.29727 mlm_acc=69.84283 nsp_loss=0.02870 nsp_acc=98.999 throughput=113.0K tks/s lr=0.0000007 time=116.40 INFO:root:[step 993249] mlm_loss=1.53267 mlm_acc=66.23101 nsp_loss=0.02542 nsp_acc=99.030 throughput=146.0K tks/s lr=0.0000007 time=142.27 INFO:root:[step 993499] mlm_loss=1.45358 mlm_acc=67.90776 nsp_loss=0.01796 nsp_acc=99.397 throughput=139.0K tks/s lr=0.0000007 time=120.97 INFO:root:[step 993749] mlm_loss=1.69949 mlm_acc=63.80202 nsp_loss=0.04237 nsp_acc=98.361 throughput=144.0K tks/s lr=0.0000006 time=158.87 INFO:root:[step 993999] mlm_loss=1.36981 mlm_acc=68.26362 nsp_loss=0.04396 nsp_acc=98.297 throughput=131.0K tks/s lr=0.0000006 time=114.78 INFO:root:[step 994249] mlm_loss=1.42598 mlm_acc=67.47303 nsp_loss=0.04462 nsp_acc=98.244 throughput=126.0K tks/s lr=0.0000006 time=125.55 INFO:root:[step 994499] mlm_loss=1.66224 mlm_acc=63.98943 nsp_loss=0.04268 nsp_acc=98.238 throughput=148.0K tks/s lr=0.0000006 time=159.10 INFO:root:[step 994749] mlm_loss=1.38542 mlm_acc=69.13597 nsp_loss=0.02122 nsp_acc=99.291 throughput=128.0K tks/s lr=0.0000005 time=116.07 INFO:root:[step 994999] mlm_loss=1.54649 mlm_acc=66.61795 nsp_loss=0.01555 nsp_acc=99.465 throughput=145.0K tks/s lr=0.0000005 time=143.42 INFO:root:[step 994999] Saving checkpoints to /home/ubuntu/ckpt-master/0994999.params, /home/ubuntu/ckpt-master/0994999.states. INFO:root:[step 995249] mlm_loss=1.31112 mlm_acc=68.83475 nsp_loss=0.02705 nsp_acc=99.073 throughput=102.0K tks/s lr=0.0000005 time=135.79 INFO:root:[step 995499] mlm_loss=1.32370 mlm_acc=69.49292 nsp_loss=0.02319 nsp_acc=99.209 throughput=122.0K tks/s lr=0.0000005 time=111.06 INFO:root:[step 995749] mlm_loss=1.50054 mlm_acc=66.51361 nsp_loss=0.01602 nsp_acc=99.428 throughput=146.0K tks/s lr=0.0000004 time=137.79 INFO:root:[step 995999] mlm_loss=1.39759 mlm_acc=68.27988 nsp_loss=0.02194 nsp_acc=99.246 throughput=137.0K tks/s lr=0.0000004 time=139.79 INFO:root:[step 996249] mlm_loss=1.31050 mlm_acc=69.86175 nsp_loss=0.02323 nsp_acc=99.236 throughput=129.0K tks/s lr=0.0000004 time=114.26 INFO:root:[step 996499] mlm_loss=1.39932 mlm_acc=67.60319 nsp_loss=0.03167 nsp_acc=98.841 throughput=137.0K tks/s lr=0.0000004 time=139.97 INFO:root:[step 996749] mlm_loss=1.41729 mlm_acc=67.68039 nsp_loss=0.02710 nsp_acc=99.056 throughput=128.0K tks/s lr=0.0000003 time=124.88 INFO:root:[step 996999] mlm_loss=1.59845 mlm_acc=65.25389 nsp_loss=0.03005 nsp_acc=98.846 throughput=145.0K tks/s lr=0.0000003 time=144.06 INFO:root:[step 997249] mlm_loss=1.64554 mlm_acc=64.05605 nsp_loss=0.02088 nsp_acc=99.222 throughput=145.0K tks/s lr=0.0000003 time=149.00 INFO:root:[step 997499] mlm_loss=1.36433 mlm_acc=68.95945 nsp_loss=0.02352 nsp_acc=99.178 throughput=129.0K tks/s lr=0.0000003 time=113.36 INFO:root:[step 997749] mlm_loss=1.30665 mlm_acc=69.47565 nsp_loss=0.02656 nsp_acc=99.061 throughput=112.0K tks/s lr=0.0000002 time=118.45 INFO:root:[step 997999] mlm_loss=1.36029 mlm_acc=68.76620 nsp_loss=0.02137 nsp_acc=99.267 throughput=135.0K tks/s lr=0.0000002 time=115.11 INFO:root:[step 998249] mlm_loss=1.49108 mlm_acc=65.88094 nsp_loss=0.02254 nsp_acc=99.199 throughput=141.0K tks/s lr=0.0000002 time=142.89 INFO:root:[step 998499] mlm_loss=1.58603 mlm_acc=66.12388 nsp_loss=0.03801 nsp_acc=98.539 throughput=141.0K tks/s lr=0.0000002 time=138.58 INFO:root:[step 998749] mlm_loss=1.37717 mlm_acc=68.37585 nsp_loss=0.03292 nsp_acc=98.748 throughput=121.0K tks/s lr=0.0000001 time=122.31 INFO:root:[step 998999] mlm_loss=1.55122 mlm_acc=66.63549 nsp_loss=0.05399 nsp_acc=97.793 throughput=147.0K tks/s lr=0.0000001 time=128.93 INFO:root:[step 999249] mlm_loss=1.51335 mlm_acc=67.17422 nsp_loss=0.03037 nsp_acc=98.818 throughput=142.0K tks/s lr=0.0000001 time=160.64 INFO:root:[step 999499] mlm_loss=1.22902 mlm_acc=70.05235 nsp_loss=0.03315 nsp_acc=98.822 throughput=117.0K tks/s lr=0.0000001 time=108.89 INFO:root:[step 999749] mlm_loss=1.12276 mlm_acc=70.98081 nsp_loss=0.04028 nsp_acc=98.574 throughput=113.0K tks/s lr=0.0000000 time=104.09 INFO:root:[step 999999] mlm_loss=1.38571 mlm_acc=68.25514 nsp_loss=0.02520 nsp_acc=99.118 throughput=133.0K tks/s lr=0.0000000 time=126.00 INFO:root:[step 999999] Saving checkpoints to /home/ubuntu/ckpt-master/0999999.params, /home/ubuntu/ckpt-master/0999999.states.