loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 ***************************************** Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed. ***************************************** loaded library: loaded library: loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1 /usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 W20220403 06:26:11.131686 2307 rpc_client.cpp:190] LoadServer 10.7.139.219 Failed at 0 times error_code 14 error_message failed to connect to all addresses ------------------------ arguments ------------------------ batches_per_epoch ............................... 834 channel_last .................................... False ddp ............................................. True exit_num ........................................ -1 fuse_bn_add_relu ................................ False fuse_bn_relu .................................... False gpu_stat_file ................................... None grad_clipping ................................... 0.0 graph ........................................... False label_smoothing ................................. 0.1 learning_rate ................................... 1.536 legacy_init ..................................... False load_path ....................................... None lr_decay_type ................................... cosine metric_local .................................... True metric_train_acc ................................ True momentum ........................................ 0.875 nccl_fusion_max_ops ............................. 24 nccl_fusion_threshold_mb ........................ 16 num_classes ..................................... 1000 num_devices_per_node ............................ 8 num_epochs ...................................... 50 num_nodes ....................................... 1 ofrecord_part_num ............................... 256 ofrecord_path ................................... /dataset/79846248 print_interval .................................. 100 print_timestamp ................................. False samples_per_epoch ............................... 1281167 save_init ....................................... False save_path ....................................... None scale_grad ...................................... False skip_eval ....................................... False synthetic_data .................................. False total_batches ................................... -1 train_batch_size ................................ 192 train_global_batch_size ......................... 1536 use_fp16 ........................................ False use_gpu_decode .................................. False val_batch_size .................................. 50 val_batches_per_epoch ........................... 125 val_global_batch_size ........................... 400 val_samples_per_epoch ........................... 50000 warmup_epochs ................................... 5 weight_decay .................................... 3.0517578125e-05 zero_init_residual .............................. True -------------------- end of arguments --------------------- ***** Model Init ***** ***** Model Init Finish, time escapled: 2.63057 s ***** [rank:7] [train], epoch: 0/50, iter: 100/834, loss: 0.85918, lr: 0.035933, top1: 0.00438, throughput: 283.90 | 2022-04-03 06:27:33.682 [rank:6] [train], epoch: 0/50, iter: 100/834, loss: 0.85907, lr: 0.035933, top1: 0.00411, throughput: 284.07 | 2022-04-03 06:27:33.694 [rank:5] [train], epoch: 0/50, iter: 100/834, loss: 0.85916, lr: 0.035933, top1: 0.00417, throughput: 283.77 | 2022-04-03 06:27:33.704 [rank:2] [train], epoch: 0/50, iter: 100/834, loss: 0.85910, lr: 0.035933, top1: 0.00396, throughput: 283.91 | 2022-04-03 06:27:33.709 [rank:0] [train], epoch: 0/50, iter: 100/834, loss: 0.85939, lr: 0.035933, top1: 0.00406, throughput: 283.75 | 2022-04-03 06:27:33.726 [rank:1] [train], epoch: 0/50, iter: 100/834, loss: 0.85929, lr: 0.035933, top1: 0.00385, throughput: 283.40 | 2022-04-03 06:27:33.728 [rank:3] [train], epoch: 0/50, iter: 100/834, loss: 0.85938, lr: 0.035933, top1: 0.00375, throughput: 283.79 | 2022-04-03 06:27:33.741 [rank:4] [train], epoch: 0/50, iter: 100/834, loss: 0.85979, lr: 0.035933, top1: 0.00344, throughput: 283.77 | 2022-04-03 06:27:33.761 timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:33.847, Tesla V100-SXM2-32GB, 470.57.02, 47 %, 21 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/03 06:27:33.853, Tesla V100-SXM2-32GB, 470.57.02, 46 %, 14 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/03 06:27:33.859, Tesla V100-SXM2-32GB, 470.57.02, 60 %, 11 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/03 06:27:33.866, Tesla V100-SXM2-32GB, 470.57.02, 41 %, 21 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/03 06:27:33.872, Tesla V100-SXM2-32GB, 470.57.02, 28 %, 8 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:33.887, Tesla V100-SXM2-32GB, 470.57.02, 81 %, 36 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:33.895, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 54 %, 32510 MiB, 11706 MiB, 20804 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:33.901, Tesla V100-SXM2-32GB, 470.57.02, 89 %, 37 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/03 06:27:33.904, Tesla V100-SXM2-32GB, 470.57.02, 47 %, 21 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/03 06:27:33.911, Tesla V100-SXM2-32GB, 470.57.02, 46 %, 14 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/03 06:27:33.937, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 76 %, 32510 MiB, 11846 MiB, 20664 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:33.962, Tesla V100-SXM2-32GB, 470.57.02, 91 %, 67 %, 32510 MiB, 11822 MiB, 20688 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:33.968, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 70 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/03 06:27:33.984, Tesla V100-SXM2-32GB, 470.57.02, 76 %, 56 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:33.999, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 70 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/03 06:27:34.064, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 51 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/03 06:27:34.065, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 65 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:34.081, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 51 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/03 06:27:34.127, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 51 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/03 06:27:34.128, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 58 %, 32510 MiB, 11706 MiB, 20804 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:34.141, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 51 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/03 06:27:34.161, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 55 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/03 06:27:34.162, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/03 06:27:34.164, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 54 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/03 06:27:34.163, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/03 06:27:34.188, Tesla V100-SXM2-32GB, 470.57.02, 98 %, 60 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:34.205, Tesla V100-SXM2-32GB, 470.57.02, 98 %, 60 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:34.207, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 51 %, 32510 MiB, 11770 MiB, 20740 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:34.222, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:34.224, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:34.225, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 51 %, 32510 MiB, 11846 MiB, 20664 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:34.228, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/03 06:27:34.245, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 60 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/03 06:27:34.247, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 60 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/03 06:27:34.248, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 66 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/03 06:27:34.258, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/03 06:27:34.252, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11750 MiB, 20760 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/03 06:27:34.271, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/03 06:27:34.296, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/03 06:27:34.299, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:34.303, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 68 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/03 06:27:34.305, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/03 06:27:34.314, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 66 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/03 06:27:34.321, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:34.322, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 66 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/03 06:27:34.322, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 68 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/03 06:27:34.332, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/03 06:27:34.334, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 60 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/03 06:27:34.335, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:34.335, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 66 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/03 06:27:34.341, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 68 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/03 06:27:34.343, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 57 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/03 06:27:34.345, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:34.345, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:34.348, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 66 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/03 06:27:34.350, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 60 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/03 06:27:34.350, Tesla V100-SXM2-32GB, 470.57.02, 82 %, 54 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:34.354, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/03 06:27:34.361, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 57 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/03 06:27:34.361, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 60 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/03 06:27:34.365, Tesla V100-SXM2-32GB, 470.57.02, 82 %, 54 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/03 06:27:34.371, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 57 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/03 06:27:34.373, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 60 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/03 06:27:34.376, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 57 %, 32510 MiB, 11786 MiB, 20724 MiB [rank:5] [train], epoch: 0/50, iter: 200/834, loss: 0.82554, lr: 0.071866, top1: 0.01339, throughput: 311.71 | 2022-04-03 06:28:35.300 [rank:2] [train], epoch: 0/50, iter: 200/834, loss: 0.82602, lr: 0.071866, top1: 0.01328, throughput: 311.60 | 2022-04-03 06:28:35.326 [rank:4] [train], epoch: 0/50, iter: 200/834, loss: 0.82587, lr: 0.071866, top1: 0.01443, throughput: 311.77 | 2022-04-03 06:28:35.346 [rank:7] [train], epoch: 0/50, iter: 200/834, loss: 0.82656, lr: 0.071866, top1: 0.01328, throughput: 311.30 | 2022-04-03 06:28:35.359 [rank:1] [train], epoch: 0/50, iter: 200/834, loss: 0.82584, lr: 0.071866, top1: 0.01391, throughput: 311.53 | 2022-04-03 06:28:35.360 [rank:3] [train], epoch: 0/50, iter: 200/834, loss: 0.82645, lr: 0.071866, top1: 0.01370, throughput: 311.53 | 2022-04-03 06:28:35.372 [rank:0] [train], epoch: 0/50, iter: 200/834, loss: 0.82619, lr: 0.071866, top1: 0.01297, throughput: 311.40 | 2022-04-03 06:28:35.382 [rank:6] [train], epoch: 0/50, iter: 200/834, loss: 0.82534, lr: 0.071866, top1: 0.01359, throughput: 311.15 | 2022-04-03 06:28:35.402 [rank:1] [train], epoch: 0/50, iter: 300/834, loss: 0.80198, lr: 0.107799, top1: 0.02146, throughput: 310.03 | 2022-04-03 06:29:37.289 [rank:7] [train], epoch: 0/50, iter: 300/834, loss: 0.80180, lr: 0.107799, top1: 0.01984, throughput: 310.02 | 2022-04-03 06:29:37.290 [rank:0] [train], epoch: 0/50, iter: 300/834, loss: 0.80284, lr: 0.107799, top1: 0.02031, throughput: 310.04 | 2022-04-03 06:29:37.310 [rank:5] [train], epoch: 0/50, iter: 300/834, loss: 0.80240, lr: 0.107799, top1: 0.02016, throughput: 309.59 | 2022-04-03 06:29:37.318 [rank:3] [train], epoch: 0/50, iter: 300/834, loss: 0.80177, lr: 0.107799, top1: 0.02010, throughput: 309.89 | 2022-04-03 06:29:37.330 [rank:6] [train], epoch: 0/50, iter: 300/834, loss: 0.80276, lr: 0.107799, top1: 0.02083, throughput: 310.00 | 2022-04-03 06:29:37.337 [rank:4] [train], epoch: 0/50, iter: 300/834, loss: 0.80309, lr: 0.107799, top1: 0.01755, throughput: 309.69 | 2022-04-03 06:29:37.343 [rank:2] [train], epoch: 0/50, iter: 300/834, loss: 0.80276, lr: 0.107799, top1: 0.01979, throughput: 309.52 | 2022-04-03 06:29:37.358 [rank:1] [train], epoch: 0/50, iter: 400/834, loss: 0.78493, lr: 0.143733, top1: 0.02729, throughput: 311.82 | 2022-04-03 06:30:38.863 [rank:5] [train], epoch: 0/50, iter: 400/834, loss: 0.78532, lr: 0.143733, top1: 0.02396, throughput: 311.91 | 2022-04-03 06:30:38.874 [rank:4] [train], epoch: 0/50, iter: 400/834, loss: 0.78591, lr: 0.143733, top1: 0.02568, throughput: 312.04 | 2022-04-03 06:30:38.875 [rank:6] [train], epoch: 0/50, iter: 400/834, loss: 0.78524, lr: 0.143733, top1: 0.02589, throughput: 311.96 | 2022-04-03 06:30:38.883 [rank:3] [train], epoch: 0/50, iter: 400/834, loss: 0.78459, lr: 0.143733, top1: 0.02792, throughput: 311.89 | 2022-04-03 06:30:38.890 [rank:7] [train], epoch: 0/50, iter: 400/834, loss: 0.78641, lr: 0.143733, top1: 0.02422, throughput: 311.64 | 2022-04-03 06:30:38.900 [rank:0] [train], epoch: 0/50, iter: 400/834, loss: 0.78570, lr: 0.143733, top1: 0.02760, throughput: 311.64 | 2022-04-03 06:30:38.919 [rank:2] [train], epoch: 0/50, iter: 400/834, loss: 0.78477, lr: 0.143733, top1: 0.02667, throughput: 312.28 | 2022-04-03 06:30:38.841 [rank:1] [train], epoch: 0/50, iter: 500/834, loss: 0.77043, lr: 0.179666, top1: 0.03234, throughput: 311.52 | 2022-04-03 06:31:40.497 [rank:2] [train], epoch: 0/50, iter: 500/834, loss: 0.77056, lr: 0.179666, top1: 0.03016, throughput: 311.37 | 2022-04-03 06:31:40.503 [rank:6] [train], epoch: 0/50, iter: 500/834, loss: 0.76982, lr: 0.179666, top1: 0.03422, throughput: 311.55 | 2022-04-03 06:31:40.510 [rank:7] [train], epoch: 0/50, iter: 500/834, loss: 0.77103, lr: 0.179666, top1: 0.03417, throughput: 311.56 | 2022-04-03 06:31:40.526 [rank:3] [train], epoch: 0/50, iter: 500/834, loss: 0.76774, lr: 0.179666, top1: 0.03208, throughput: 311.49 | 2022-04-03 06:31:40.529 [rank:0] [train], epoch: 0/50, iter: 500/834, loss: 0.76840, lr: 0.179666, top1: 0.03188, throughput: 311.61 | 2022-04-03 06:31:40.535 [rank:5] [train], epoch: 0/50, iter: 500/834, loss: 0.77025, lr: 0.179666, top1: 0.03365, throughput: 311.35 | 2022-04-03 06:31:40.541 [rank:4] [train], epoch: 0/50, iter: 500/834, loss: 0.76973, lr: 0.179666, top1: 0.03349, throughput: 311.30 | 2022-04-03 06:31:40.552 [rank:1] [train], epoch: 0/50, iter: 600/834, loss: 0.75506, lr: 0.215599, top1: 0.04099, throughput: 310.61 | 2022-04-03 06:32:42.311 [rank:3] [train], epoch: 0/50, iter: 600/834, loss: 0.75344, lr: 0.215599, top1: 0.04177, throughput: 310.74 | 2022-04-03 06:32:42.317 [rank:4] [train], epoch: 0/50, iter: 600/834, loss: 0.75434, lr: 0.215599, top1: 0.04068, throughput: 310.77 | 2022-04-03 06:32:42.334 [rank:6] [train], epoch: 0/50, iter: 600/834, loss: 0.75482, lr: 0.215599, top1: 0.04141, throughput: 310.45 | 2022-04-03 06:32:42.354 [rank:5] [train], epoch: 0/50, iter: 600/834, loss: 0.75426, lr: 0.215599, top1: 0.04500, throughput: 310.60 | 2022-04-03 06:32:42.356 [rank:7] [train], epoch: 0/50, iter: 600/834, loss: 0.75657, lr: 0.215599, top1: 0.04089, throughput: 310.40 | 2022-04-03 06:32:42.381 [rank:0] [train], epoch: 0/50, iter: 600/834, loss: 0.75575, lr: 0.215599, top1: 0.03984, throughput: 310.39 | 2022-04-03 06:32:42.393 [rank:2] [train], epoch: 0/50, iter: 600/834, loss: 0.75487, lr: 0.215599, top1: 0.04281, throughput: 310.09 | 2022-04-03 06:32:42.421 [rank:0] [train], epoch: 0/50, iter: 700/834, loss: 0.74049, lr: 0.251532, top1: 0.05135, throughput: 311.68 | 2022-04-03 06:33:43.994 [rank:1] [train], epoch: 0/50, iter: 700/834, loss: 0.73853, lr: 0.251532, top1: 0.05047, throughput: 311.23 | 2022-04-03 06:33:44.003 [rank:3] [train], epoch: 0/50, iter: 700/834, loss: 0.73904, lr: 0.251532, top1: 0.04953, throughput: 311.25 | 2022-04-03 06:33:44.003 [rank:6] [train], epoch: 0/50, iter: 700/834, loss: 0.73989, lr: 0.251532, top1: 0.05089, throughput: 311.38 | 2022-04-03 06:33:44.015 [rank:5] [train], epoch: 0/50, iter: 700/834, loss: 0.73902, lr: 0.251532, top1: 0.05172, throughput: 311.31 | 2022-04-03 06:33:44.031 [rank:4] [train], epoch: 0/50, iter: 700/834, loss: 0.73782, lr: 0.251532, top1: 0.04812, throughput: 311.14 | 2022-04-03 06:33:44.041 [rank:2] [train], epoch: 0/50, iter: 700/834, loss: 0.73926, lr: 0.251532, top1: 0.05193, throughput: 311.55 | 2022-04-03 06:33:44.049 [rank:7] [train], epoch: 0/50, iter: 700/834, loss: 0.73943, lr: 0.251532, top1: 0.04938, throughput: 311.23 | 2022-04-03 06:33:44.072 [rank:1] [train], epoch: 0/50, iter: 800/834, loss: 0.72380, lr: 0.287465, top1: 0.05880, throughput: 311.60 | 2022-04-03 06:34:45.620 [rank:5] [train], epoch: 0/50, iter: 800/834, loss: 0.72518, lr: 0.287465, top1: 0.06089, throughput: 311.50 | 2022-04-03 06:34:45.668 [rank:7] [train], epoch: 0/50, iter: 800/834, loss: 0.72573, lr: 0.287465, top1: 0.05594, throughput: 311.67 | 2022-04-03 06:34:45.675 [rank:6] [train], epoch: 0/50, iter: 800/834, loss: 0.72246, lr: 0.287465, top1: 0.06276, throughput: 311.39 | 2022-04-03 06:34:45.675 [rank:3] [train], epoch: 0/50, iter: 800/834, loss: 0.72515, lr: 0.287465, top1: 0.06281, throughput: 311.25 | 2022-04-03 06:34:45.690 [rank:0] [train], epoch: 0/50, iter: 800/834, loss: 0.72517, lr: 0.287465, top1: 0.06042, throughput: 311.19 | 2022-04-03 06:34:45.693 [rank:4] [train], epoch: 0/50, iter: 800/834, loss: 0.72469, lr: 0.287465, top1: 0.05880, throughput: 311.34 | 2022-04-03 06:34:45.710 [rank:2] [train], epoch: 0/50, iter: 800/834, loss: 0.72526, lr: 0.287465, top1: 0.05833, throughput: 311.36 | 2022-04-03 06:34:45.713 [rank:3] [train], epoch: 0/50, iter: 834/834, loss: 0.71703, lr: 0.299682, top1: 0.06556, throughput: 311.28 | 2022-04-03 06:35:06.661 [rank:5] [train], epoch: 0/50, iter: 834/834, loss: 0.71561, lr: 0.299682, top1: 0.06725, throughput: 310.89 | 2022-04-03 06:35:06.665 [rank:2] [train], epoch: 0/50, iter: 834/834, loss: 0.71481, lr: 0.299682, top1: 0.06801, throughput: 311.52 | 2022-04-03 06:35:06.669 [rank:0] [train], epoch: 0/50, iter: 834/834, loss: 0.71253, lr: 0.299682, top1: 0.07184, throughput: 311.19 | 2022-04-03 06:35:06.671 [rank:1] [train], epoch: 0/50, iter: 834/834, loss: 0.71580, lr: 0.299682, top1: 0.06281, throughput: 309.97 | 2022-04-03 06:35:06.680 [rank:6] [train], epoch: 0/50, iter: 834/834, loss: 0.71509, lr: 0.299682, top1: 0.06740, throughput: 310.73 | 2022-04-03 06:35:06.683 [rank:4] [train], epoch: 0/50, iter: 834/834, loss: 0.71643, lr: 0.299682, top1: 0.05898, throughput: 311.23 | 2022-04-03 06:35:06.684 [rank:7] [train], epoch: 0/50, iter: 834/834, loss: 0.71662, lr: 0.299682, top1: 0.06388, throughput: 310.28 | 2022-04-03 06:35:06.714 [rank:1] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07824, throughput: 472.50 | 2022-04-03 06:35:19.908 [rank:0] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07360, throughput: 471.60 | 2022-04-03 06:35:19.924 [rank:4] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07888, throughput: 472.01 | 2022-04-03 06:35:19.926 [rank:7] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07408, throughput: 472.73 | 2022-04-03 06:35:19.935 [rank:2] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07792, throughput: 470.91 | 2022-04-03 06:35:19.941 [rank:6] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07952, throughput: 471.07 | 2022-04-03 06:35:19.951 [rank:5] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07712, throughput: 470.42 | 2022-04-03 06:35:19.952 [rank:3] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.07248, throughput: 466.37 | 2022-04-03 06:35:20.062 [rank:0] [train], epoch: 1/50, iter: 100/834, loss: 0.70336, lr: 0.335615, top1: 0.07547, throughput: 313.31 | 2022-04-03 06:36:21.205 [rank:5] [train], epoch: 1/50, iter: 100/834, loss: 0.70379, lr: 0.335615, top1: 0.07906, throughput: 313.37 | 2022-04-03 06:36:21.220 [rank:4] [train], epoch: 1/50, iter: 100/834, loss: 0.70583, lr: 0.335615, top1: 0.07177, throughput: 313.21 | 2022-04-03 06:36:21.225 [rank:7] [train], epoch: 1/50, iter: 100/834, loss: 0.70511, lr: 0.335615, top1: 0.07531, throughput: 313.24 | 2022-04-03 06:36:21.230 [rank:3] [train], epoch: 1/50, iter: 100/834, loss: 0.70410, lr: 0.335615, top1: 0.07182, throughput: 314.18 | 2022-04-03 06:36:21.174 [rank:2] [train], epoch: 1/50, iter: 100/834, loss: 0.70314, lr: 0.335615, top1: 0.07703, throughput: 313.13 | 2022-04-03 06:36:21.258 [rank:6] [train], epoch: 1/50, iter: 100/834, loss: 0.70607, lr: 0.335615, top1: 0.07552, throughput: 313.60 | 2022-04-03 06:36:21.175 [rank:1] [train], epoch: 1/50, iter: 100/834, loss: 0.70410, lr: 0.335615, top1: 0.07641, throughput: 312.81 | 2022-04-03 06:36:21.286 [rank:5] [train], epoch: 1/50, iter: 200/834, loss: 0.68742, lr: 0.371549, top1: 0.09203, throughput: 311.24 | 2022-04-03 06:37:22.910 [rank:4] [train], epoch: 1/50, iter: 200/834, loss: 0.68766, lr: 0.371549, top1: 0.09089, throughput: 311.19 | 2022-04-03 06:37:22.925 [rank:3] [train], epoch: 1/50, iter: 200/834, loss: 0.68827, lr: 0.371549, top1: 0.08995, throughput: 310.88 | 2022-04-03 06:37:22.933 [rank:0] [train], epoch: 1/50, iter: 200/834, loss: 0.68771, lr: 0.371549, top1: 0.08974, throughput: 311.00 | 2022-04-03 06:37:22.941 [rank:7] [train], epoch: 1/50, iter: 200/834, loss: 0.68706, lr: 0.371549, top1: 0.09083, throughput: 311.00 | 2022-04-03 06:37:22.965 [rank:2] [train], epoch: 1/50, iter: 200/834, loss: 0.68520, lr: 0.371549, top1: 0.08698, throughput: 311.13 | 2022-04-03 06:37:22.968 [rank:6] [train], epoch: 1/50, iter: 200/834, loss: 0.68925, lr: 0.371549, top1: 0.08698, throughput: 310.66 | 2022-04-03 06:37:22.979 [rank:1] [train], epoch: 1/50, iter: 200/834, loss: 0.68826, lr: 0.371549, top1: 0.08833, throughput: 311.06 | 2022-04-03 06:37:23.011 [rank:3] [train], epoch: 1/50, iter: 300/834, loss: 0.67324, lr: 0.407482, top1: 0.10443, throughput: 311.45 | 2022-04-03 06:38:24.581 [rank:5] [train], epoch: 1/50, iter: 300/834, loss: 0.67322, lr: 0.407482, top1: 0.10339, throughput: 311.15 | 2022-04-03 06:38:24.617 [rank:1] [train], epoch: 1/50, iter: 300/834, loss: 0.67553, lr: 0.407482, top1: 0.09797, throughput: 311.58 | 2022-04-03 06:38:24.632 [rank:4] [train], epoch: 1/50, iter: 300/834, loss: 0.67334, lr: 0.407482, top1: 0.10297, throughput: 311.13 | 2022-04-03 06:38:24.635 [rank:7] [train], epoch: 1/50, iter: 300/834, loss: 0.67182, lr: 0.407482, top1: 0.10203, throughput: 311.23 | 2022-04-03 06:38:24.656 [rank:6] [train], epoch: 1/50, iter: 300/834, loss: 0.67449, lr: 0.407482, top1: 0.10214, throughput: 311.18 | 2022-04-03 06:38:24.680 [rank:0] [train], epoch: 1/50, iter: 300/834, loss: 0.67195, lr: 0.407482, top1: 0.10365, throughput: 310.84 | 2022-04-03 06:38:24.709 [rank:2] [train], epoch: 1/50, iter: 300/834, loss: 0.67305, lr: 0.407482, top1: 0.10281, throughput: 310.97 | 2022-04-03 06:38:24.711 [rank:5] [train], epoch: 1/50, iter: 400/834, loss: 0.65666, lr: 0.443415, top1: 0.11745, throughput: 312.45 | 2022-04-03 06:39:26.067 [rank:1] [train], epoch: 1/50, iter: 400/834, loss: 0.65651, lr: 0.443415, top1: 0.11776, throughput: 312.51 | 2022-04-03 06:39:26.070 [rank:3] [train], epoch: 1/50, iter: 400/834, loss: 0.66114, lr: 0.443415, top1: 0.11401, throughput: 312.19 | 2022-04-03 06:39:26.081 [rank:4] [train], epoch: 1/50, iter: 400/834, loss: 0.65916, lr: 0.443415, top1: 0.11286, throughput: 312.33 | 2022-04-03 06:39:26.109 [rank:0] [train], epoch: 1/50, iter: 400/834, loss: 0.65496, lr: 0.443415, top1: 0.11885, throughput: 312.56 | 2022-04-03 06:39:26.138 [rank:7] [train], epoch: 1/50, iter: 400/834, loss: 0.65856, lr: 0.443415, top1: 0.11224, throughput: 312.29 | 2022-04-03 06:39:26.138 [rank:6] [train], epoch: 1/50, iter: 400/834, loss: 0.66046, lr: 0.443415, top1: 0.11229, throughput: 312.81 | 2022-04-03 06:39:26.058 [rank:2] [train], epoch: 1/50, iter: 400/834, loss: 0.65827, lr: 0.443415, top1: 0.11156, throughput: 312.38 | 2022-04-03 06:39:26.174 [rank:4] [train], epoch: 1/50, iter: 500/834, loss: 0.64013, lr: 0.479348, top1: 0.13464, throughput: 310.85 | 2022-04-03 06:40:27.875 [rank:3] [train], epoch: 1/50, iter: 500/834, loss: 0.64272, lr: 0.479348, top1: 0.13172, throughput: 310.56 | 2022-04-03 06:40:27.905 [rank:2] [train], epoch: 1/50, iter: 500/834, loss: 0.64397, lr: 0.479348, top1: 0.12844, throughput: 310.95 | 2022-04-03 06:40:27.919 [rank:7] [train], epoch: 1/50, iter: 500/834, loss: 0.64305, lr: 0.479348, top1: 0.13146, throughput: 310.66 | 2022-04-03 06:40:27.942 [rank:0] [train], epoch: 1/50, iter: 500/834, loss: 0.64394, lr: 0.479348, top1: 0.12807, throughput: 310.65 | 2022-04-03 06:40:27.944 [rank:6] [train], epoch: 1/50, iter: 500/834, loss: 0.64386, lr: 0.479348, top1: 0.12896, throughput: 310.23 | 2022-04-03 06:40:27.948 [rank:1] [train], epoch: 1/50, iter: 500/834, loss: 0.64189, lr: 0.479348, top1: 0.13120, throughput: 310.24 | 2022-04-03 06:40:27.958 [rank:5] [train], epoch: 1/50, iter: 500/834, loss: 0.63965, lr: 0.479348, top1: 0.13458, throughput: 310.18 | 2022-04-03 06:40:27.966 [rank:2] [train], epoch: 1/50, iter: 600/834, loss: 0.62733, lr: 0.515281, top1: 0.14682, throughput: 311.01 | 2022-04-03 06:41:29.654 [rank:4] [train], epoch: 1/50, iter: 600/834, loss: 0.62801, lr: 0.515281, top1: 0.14120, throughput: 310.68 | 2022-04-03 06:41:29.675 [rank:1] [train], epoch: 1/50, iter: 600/834, loss: 0.62735, lr: 0.515281, top1: 0.15052, throughput: 311.05 | 2022-04-03 06:41:29.684 [rank:3] [train], epoch: 1/50, iter: 600/834, loss: 0.62831, lr: 0.515281, top1: 0.14682, throughput: 310.77 | 2022-04-03 06:41:29.687 [rank:5] [train], epoch: 1/50, iter: 600/834, loss: 0.62634, lr: 0.515281, top1: 0.14885, throughput: 310.95 | 2022-04-03 06:41:29.712 [rank:0] [train], epoch: 1/50, iter: 600/834, loss: 0.62647, lr: 0.515281, top1: 0.14510, throughput: 310.84 | 2022-04-03 06:41:29.712 [rank:7] [train], epoch: 1/50, iter: 600/834, loss: 0.62595, lr: 0.515281, top1: 0.14849, throughput: 310.83 | 2022-04-03 06:41:29.713 [rank:6] [train], epoch: 1/50, iter: 600/834, loss: 0.62730, lr: 0.515281, top1: 0.15104, throughput: 310.64 | 2022-04-03 06:41:29.757 [rank:1] [train], epoch: 1/50, iter: 700/834, loss: 0.61356, lr: 0.551214, top1: 0.16161, throughput: 311.27 | 2022-04-03 06:42:31.367 [rank:3] [train], epoch: 1/50, iter: 700/834, loss: 0.61258, lr: 0.551214, top1: 0.16417, throughput: 311.25 | 2022-04-03 06:42:31.373 [rank:5] [train], epoch: 1/50, iter: 700/834, loss: 0.61567, lr: 0.551214, top1: 0.16182, throughput: 311.27 | 2022-04-03 06:42:31.394 [rank:7] [train], epoch: 1/50, iter: 700/834, loss: 0.61429, lr: 0.551214, top1: 0.16104, throughput: 311.12 | 2022-04-03 06:42:31.426 [rank:4] [train], epoch: 1/50, iter: 700/834, loss: 0.61438, lr: 0.551214, top1: 0.15807, throughput: 310.92 | 2022-04-03 06:42:31.426 [rank:0] [train], epoch: 1/50, iter: 700/834, loss: 0.61106, lr: 0.551214, top1: 0.16411, throughput: 311.04 | 2022-04-03 06:42:31.441 [rank:2] [train], epoch: 1/50, iter: 700/834, loss: 0.61125, lr: 0.551214, top1: 0.16333, throughput: 310.71 | 2022-04-03 06:42:31.448 [rank:6] [train], epoch: 1/50, iter: 700/834, loss: 0.61888, lr: 0.551214, top1: 0.15625, throughput: 311.65 | 2022-04-03 06:42:31.364 [rank:4] [train], epoch: 1/50, iter: 800/834, loss: 0.60221, lr: 0.587147, top1: 0.17365, throughput: 312.47 | 2022-04-03 06:43:32.871 [rank:7] [train], epoch: 1/50, iter: 800/834, loss: 0.60015, lr: 0.587147, top1: 0.17911, throughput: 312.24 | 2022-04-03 06:43:32.917 [rank:6] [train], epoch: 1/50, iter: 800/834, loss: 0.59955, lr: 0.587147, top1: 0.17948, throughput: 311.87 | 2022-04-03 06:43:32.929 [rank:3] [train], epoch: 1/50, iter: 800/834, loss: 0.59982, lr: 0.587147, top1: 0.17583, throughput: 311.87 | 2022-04-03 06:43:32.937 [rank:0] [train], epoch: 1/50, iter: 800/834, loss: 0.59952, lr: 0.587147, top1: 0.17740, throughput: 312.11 | 2022-04-03 06:43:32.957 [rank:5] [train], epoch: 1/50, iter: 800/834, loss: 0.60110, lr: 0.587147, top1: 0.17661, throughput: 311.84 | 2022-04-03 06:43:32.964 [rank:1] [train], epoch: 1/50, iter: 800/834, loss: 0.59744, lr: 0.587147, top1: 0.18250, throughput: 311.62 | 2022-04-03 06:43:32.980 [rank:2] [train], epoch: 1/50, iter: 800/834, loss: 0.59955, lr: 0.587147, top1: 0.17380, throughput: 311.96 | 2022-04-03 06:43:32.994 [rank:6] [train], epoch: 1/50, iter: 834/834, loss: 0.59068, lr: 0.599365, top1: 0.17754, throughput: 311.65 | 2022-04-03 06:43:53.876 [rank:4] [train], epoch: 1/50, iter: 834/834, loss: 0.59441, lr: 0.599365, top1: 0.18490, throughput: 310.73 | 2022-04-03 06:43:53.879 [rank:3] [train], epoch: 1/50, iter: 834/834, loss: 0.58804, lr: 0.599365, top1: 0.18704, throughput: 311.68 | 2022-04-03 06:43:53.881 [rank:1] [train], epoch: 1/50, iter: 834/834, loss: 0.59317, lr: 0.599365, top1: 0.18673, throughput: 312.29 | 2022-04-03 06:43:53.884 [rank:7] [train], epoch: 1/50, iter: 834/834, loss: 0.59165, lr: 0.599365, top1: 0.18903, throughput: 311.31 | 2022-04-03 06:43:53.887 [rank:0] [train], epoch: 1/50, iter: 834/834, loss: 0.58527, lr: 0.599365, top1: 0.19807, throughput: 311.77 | 2022-04-03 06:43:53.896 [rank:5] [train], epoch: 1/50, iter: 834/834, loss: 0.59622, lr: 0.599365, top1: 0.17525, throughput: 311.85 | 2022-04-03 06:43:53.897 [rank:2] [train], epoch: 1/50, iter: 834/834, loss: 0.58903, lr: 0.599365, top1: 0.19301, throughput: 311.69 | 2022-04-03 06:43:53.938 [rank:0] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.17216, throughput: 485.67 | 2022-04-03 06:44:06.765 [rank:1] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.16672, throughput: 484.93 | 2022-04-03 06:44:06.773 [rank:6] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.16816, throughput: 484.42 | 2022-04-03 06:44:06.778 [rank:4] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.16448, throughput: 484.46 | 2022-04-03 06:44:06.780 [rank:7] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.16640, throughput: 484.71 | 2022-04-03 06:44:06.781 [rank:2] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.17632, throughput: 486.63 | 2022-04-03 06:44:06.781 [rank:5] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.16448, throughput: 485.05 | 2022-04-03 06:44:06.782 [rank:3] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.16496, throughput: 483.62 | 2022-04-03 06:44:06.804 [rank:3] [train], epoch: 2/50, iter: 100/834, loss: 0.58315, lr: 0.635298, top1: 0.19932, throughput: 312.84 | 2022-04-03 06:45:08.178 [rank:5] [train], epoch: 2/50, iter: 100/834, loss: 0.57957, lr: 0.635298, top1: 0.20240, throughput: 312.68 | 2022-04-03 06:45:08.186 [rank:0] [train], epoch: 2/50, iter: 100/834, loss: 0.58101, lr: 0.635298, top1: 0.20359, throughput: 312.56 | 2022-04-03 06:45:08.194 [rank:2] [train], epoch: 2/50, iter: 100/834, loss: 0.58155, lr: 0.635298, top1: 0.20380, throughput: 312.59 | 2022-04-03 06:45:08.204 [rank:6] [train], epoch: 2/50, iter: 100/834, loss: 0.57933, lr: 0.635298, top1: 0.20422, throughput: 312.45 | 2022-04-03 06:45:08.227 [rank:4] [train], epoch: 2/50, iter: 100/834, loss: 0.58252, lr: 0.635298, top1: 0.19943, throughput: 312.42 | 2022-04-03 06:45:08.236 [rank:7] [train], epoch: 2/50, iter: 100/834, loss: 0.58106, lr: 0.635298, top1: 0.19964, throughput: 312.37 | 2022-04-03 06:45:08.247 [rank:1] [train], epoch: 2/50, iter: 100/834, loss: 0.58114, lr: 0.635298, top1: 0.19849, throughput: 312.30 | 2022-04-03 06:45:08.251 [rank:2] [train], epoch: 2/50, iter: 200/834, loss: 0.57256, lr: 0.671231, top1: 0.21135, throughput: 309.90 | 2022-04-03 06:46:10.159 [rank:5] [train], epoch: 2/50, iter: 200/834, loss: 0.56730, lr: 0.671231, top1: 0.22125, throughput: 309.78 | 2022-04-03 06:46:10.166 [rank:1] [train], epoch: 2/50, iter: 200/834, loss: 0.56899, lr: 0.671231, top1: 0.21583, throughput: 310.07 | 2022-04-03 06:46:10.173 [rank:6] [train], epoch: 2/50, iter: 200/834, loss: 0.56846, lr: 0.671231, top1: 0.21260, throughput: 309.94 | 2022-04-03 06:46:10.175 [rank:7] [train], epoch: 2/50, iter: 200/834, loss: 0.57248, lr: 0.671231, top1: 0.21010, throughput: 309.90 | 2022-04-03 06:46:10.203 [rank:4] [train], epoch: 2/50, iter: 200/834, loss: 0.57044, lr: 0.671231, top1: 0.21396, throughput: 309.80 | 2022-04-03 06:46:10.213 [rank:0] [train], epoch: 2/50, iter: 200/834, loss: 0.57127, lr: 0.671231, top1: 0.21172, throughput: 309.48 | 2022-04-03 06:46:10.234 [rank:3] [train], epoch: 2/50, iter: 200/834, loss: 0.57099, lr: 0.671231, top1: 0.21599, throughput: 309.27 | 2022-04-03 06:46:10.259 [rank:5] [train], epoch: 2/50, iter: 300/834, loss: 0.56089, lr: 0.707164, top1: 0.22557, throughput: 313.70 | 2022-04-03 06:47:11.370 [rank:6] [train], epoch: 2/50, iter: 300/834, loss: 0.55980, lr: 0.707164, top1: 0.22948, throughput: 313.70 | 2022-04-03 06:47:11.380 [rank:1] [train], epoch: 2/50, iter: 300/834, loss: 0.55864, lr: 0.707164, top1: 0.22755, throughput: 313.66 | 2022-04-03 06:47:11.386 [rank:3] [train], epoch: 2/50, iter: 300/834, loss: 0.55928, lr: 0.707164, top1: 0.22901, throughput: 314.02 | 2022-04-03 06:47:11.401 [rank:0] [train], epoch: 2/50, iter: 300/834, loss: 0.55834, lr: 0.707164, top1: 0.22958, throughput: 313.88 | 2022-04-03 06:47:11.403 [rank:4] [train], epoch: 2/50, iter: 300/834, loss: 0.56279, lr: 0.707164, top1: 0.22318, throughput: 313.77 | 2022-04-03 06:47:11.403 [rank:2] [train], epoch: 2/50, iter: 300/834, loss: 0.56113, lr: 0.707164, top1: 0.22766, throughput: 313.45 | 2022-04-03 06:47:11.412 [rank:7] [train], epoch: 2/50, iter: 300/834, loss: 0.56296, lr: 0.707164, top1: 0.22365, throughput: 313.60 | 2022-04-03 06:47:11.427 [rank:3] [train], epoch: 2/50, iter: 400/834, loss: 0.55082, lr: 0.743097, top1: 0.23641, throughput: 311.73 | 2022-04-03 06:48:12.994 [rank:5] [train], epoch: 2/50, iter: 400/834, loss: 0.54937, lr: 0.743097, top1: 0.24109, throughput: 311.56 | 2022-04-03 06:48:12.995 [rank:1] [train], epoch: 2/50, iter: 400/834, loss: 0.55128, lr: 0.743097, top1: 0.24125, throughput: 311.60 | 2022-04-03 06:48:13.003 [rank:6] [train], epoch: 2/50, iter: 400/834, loss: 0.55123, lr: 0.743097, top1: 0.24016, throughput: 311.56 | 2022-04-03 06:48:13.006 [rank:2] [train], epoch: 2/50, iter: 400/834, loss: 0.55010, lr: 0.743097, top1: 0.23995, throughput: 311.62 | 2022-04-03 06:48:13.026 [rank:4] [train], epoch: 2/50, iter: 400/834, loss: 0.54819, lr: 0.743097, top1: 0.24500, throughput: 311.53 | 2022-04-03 06:48:13.035 [rank:7] [train], epoch: 2/50, iter: 400/834, loss: 0.55202, lr: 0.743097, top1: 0.23385, throughput: 312.01 | 2022-04-03 06:48:12.964 [rank:0] [train], epoch: 2/50, iter: 400/834, loss: 0.54974, lr: 0.743097, top1: 0.23901, throughput: 311.44 | 2022-04-03 06:48:13.052 [rank:4] [train], epoch: 2/50, iter: 500/834, loss: 0.53929, lr: 0.779030, top1: 0.25422, throughput: 310.79 | 2022-04-03 06:49:14.813 [rank:2] [train], epoch: 2/50, iter: 500/834, loss: 0.54133, lr: 0.779030, top1: 0.25219, throughput: 310.74 | 2022-04-03 06:49:14.813 [rank:7] [train], epoch: 2/50, iter: 500/834, loss: 0.54255, lr: 0.779030, top1: 0.25188, throughput: 310.43 | 2022-04-03 06:49:14.813 [rank:5] [train], epoch: 2/50, iter: 500/834, loss: 0.53848, lr: 0.779030, top1: 0.25776, throughput: 310.45 | 2022-04-03 06:49:14.841 [rank:6] [train], epoch: 2/50, iter: 500/834, loss: 0.53875, lr: 0.779030, top1: 0.25443, throughput: 310.47 | 2022-04-03 06:49:14.847 [rank:3] [train], epoch: 2/50, iter: 500/834, loss: 0.54156, lr: 0.779030, top1: 0.25417, throughput: 310.40 | 2022-04-03 06:49:14.849 [rank:0] [train], epoch: 2/50, iter: 500/834, loss: 0.54136, lr: 0.779030, top1: 0.24958, throughput: 310.63 | 2022-04-03 06:49:14.862 [rank:1] [train], epoch: 2/50, iter: 500/834, loss: 0.54287, lr: 0.779030, top1: 0.25234, throughput: 310.36 | 2022-04-03 06:49:14.866 [rank:6] [train], epoch: 2/50, iter: 600/834, loss: 0.53489, lr: 0.814963, top1: 0.26427, throughput: 313.00 | 2022-04-03 06:50:16.189 [rank:1] [train], epoch: 2/50, iter: 600/834, loss: 0.53282, lr: 0.814963, top1: 0.26589, throughput: 313.08 | 2022-04-03 06:50:16.193 [rank:2] [train], epoch: 2/50, iter: 600/834, loss: 0.53066, lr: 0.814963, top1: 0.26734, throughput: 312.79 | 2022-04-03 06:50:16.196 [rank:5] [train], epoch: 2/50, iter: 600/834, loss: 0.53024, lr: 0.814963, top1: 0.26901, throughput: 312.89 | 2022-04-03 06:50:16.204 [rank:7] [train], epoch: 2/50, iter: 600/834, loss: 0.53159, lr: 0.814963, top1: 0.26776, throughput: 312.61 | 2022-04-03 06:50:16.232 [rank:4] [train], epoch: 2/50, iter: 600/834, loss: 0.53186, lr: 0.814963, top1: 0.26547, throughput: 312.57 | 2022-04-03 06:50:16.239 [rank:3] [train], epoch: 2/50, iter: 600/834, loss: 0.52755, lr: 0.814963, top1: 0.27344, throughput: 312.70 | 2022-04-03 06:50:16.249 [rank:0] [train], epoch: 2/50, iter: 600/834, loss: 0.53047, lr: 0.814963, top1: 0.26635, throughput: 312.76 | 2022-04-03 06:50:16.250 [rank:5] [train], epoch: 2/50, iter: 700/834, loss: 0.52258, lr: 0.850896, top1: 0.27521, throughput: 312.41 | 2022-04-03 06:51:17.662 [rank:3] [train], epoch: 2/50, iter: 700/834, loss: 0.52120, lr: 0.850896, top1: 0.28083, throughput: 312.37 | 2022-04-03 06:51:17.714 [rank:7] [train], epoch: 2/50, iter: 700/834, loss: 0.52520, lr: 0.850896, top1: 0.27172, throughput: 312.21 | 2022-04-03 06:51:17.730 [rank:6] [train], epoch: 2/50, iter: 700/834, loss: 0.52244, lr: 0.850896, top1: 0.27937, throughput: 311.91 | 2022-04-03 06:51:17.746 [rank:4] [train], epoch: 2/50, iter: 700/834, loss: 0.52113, lr: 0.850896, top1: 0.28135, throughput: 312.07 | 2022-04-03 06:51:17.764 [rank:0] [train], epoch: 2/50, iter: 700/834, loss: 0.52354, lr: 0.850896, top1: 0.27583, throughput: 312.12 | 2022-04-03 06:51:17.766 [rank:1] [train], epoch: 2/50, iter: 700/834, loss: 0.52130, lr: 0.850896, top1: 0.27901, throughput: 311.70 | 2022-04-03 06:51:17.790 [rank:2] [train], epoch: 2/50, iter: 700/834, loss: 0.52079, lr: 0.850896, top1: 0.28172, throughput: 311.67 | 2022-04-03 06:51:17.800 [rank:1] [train], epoch: 2/50, iter: 800/834, loss: 0.51393, lr: 0.886830, top1: 0.29781, throughput: 310.95 | 2022-04-03 06:52:19.536 [rank:0] [train], epoch: 2/50, iter: 800/834, loss: 0.51745, lr: 0.886830, top1: 0.28833, throughput: 310.64 | 2022-04-03 06:52:19.574 [rank:4] [train], epoch: 2/50, iter: 800/834, loss: 0.51529, lr: 0.886830, top1: 0.29078, throughput: 310.63 | 2022-04-03 06:52:19.574 [rank:3] [train], epoch: 2/50, iter: 800/834, loss: 0.51752, lr: 0.886830, top1: 0.28885, throughput: 310.36 | 2022-04-03 06:52:19.578 [rank:5] [train], epoch: 2/50, iter: 800/834, loss: 0.51761, lr: 0.886830, top1: 0.29224, throughput: 310.08 | 2022-04-03 06:52:19.581 [rank:2] [train], epoch: 2/50, iter: 800/834, loss: 0.51682, lr: 0.886830, top1: 0.29000, throughput: 310.71 | 2022-04-03 06:52:19.593 [rank:7] [train], epoch: 2/50, iter: 800/834, loss: 0.51429, lr: 0.886830, top1: 0.28880, throughput: 310.35 | 2022-04-03 06:52:19.595 [rank:6] [train], epoch: 2/50, iter: 800/834, loss: 0.51498, lr: 0.886830, top1: 0.28859, throughput: 310.42 | 2022-04-03 06:52:19.598 [rank:0] [train], epoch: 2/50, iter: 834/834, loss: 0.50840, lr: 0.899047, top1: 0.29963, throughput: 311.61 | 2022-04-03 06:52:40.523 [rank:1] [train], epoch: 2/50, iter: 834/834, loss: 0.50754, lr: 0.899047, top1: 0.29810, throughput: 311.01 | 2022-04-03 06:52:40.525 [rank:4] [train], epoch: 2/50, iter: 834/834, loss: 0.51038, lr: 0.899047, top1: 0.30515, throughput: 311.52 | 2022-04-03 06:52:40.530 [rank:6] [train], epoch: 2/50, iter: 834/834, loss: 0.51426, lr: 0.899047, top1: 0.28692, throughput: 311.83 | 2022-04-03 06:52:40.533 [rank:2] [train], epoch: 2/50, iter: 834/834, loss: 0.51186, lr: 0.899047, top1: 0.29320, throughput: 311.74 | 2022-04-03 06:52:40.534 [rank:5] [train], epoch: 2/50, iter: 834/834, loss: 0.51354, lr: 0.899047, top1: 0.29259, throughput: 311.56 | 2022-04-03 06:52:40.534 [rank:3] [train], epoch: 2/50, iter: 834/834, loss: 0.51193, lr: 0.899047, top1: 0.29825, throughput: 311.47 | 2022-04-03 06:52:40.537 [rank:7] [train], epoch: 2/50, iter: 834/834, loss: 0.51292, lr: 0.899047, top1: 0.29534, throughput: 311.70 | 2022-04-03 06:52:40.539 [rank:0] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26416, throughput: 483.47 | 2022-04-03 06:52:53.451 [rank:1] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26688, throughput: 483.00 | 2022-04-03 06:52:53.465 [rank:2] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26736, throughput: 483.29 | 2022-04-03 06:52:53.466 [rank:6] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26720, throughput: 483.22 | 2022-04-03 06:52:53.467 [rank:5] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.25232, throughput: 483.16 | 2022-04-03 06:52:53.469 [rank:4] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26256, throughput: 482.95 | 2022-04-03 06:52:53.471 [rank:7] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26160, throughput: 482.70 | 2022-04-03 06:52:53.487 [rank:3] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.25696, throughput: 482.52 | 2022-04-03 06:52:53.490 [rank:7] [train], epoch: 3/50, iter: 100/834, loss: 0.50028, lr: 0.934980, top1: 0.31297, throughput: 312.26 | 2022-04-03 06:53:54.975 [rank:2] [train], epoch: 3/50, iter: 100/834, loss: 0.50385, lr: 0.934980, top1: 0.30672, throughput: 312.04 | 2022-04-03 06:53:54.996 [rank:3] [train], epoch: 3/50, iter: 100/834, loss: 0.50245, lr: 0.934980, top1: 0.30839, throughput: 312.11 | 2022-04-03 06:53:55.008 [rank:0] [train], epoch: 3/50, iter: 100/834, loss: 0.50060, lr: 0.934980, top1: 0.31109, throughput: 311.85 | 2022-04-03 06:53:55.019 [rank:6] [train], epoch: 3/50, iter: 100/834, loss: 0.50285, lr: 0.934980, top1: 0.30818, throughput: 311.93 | 2022-04-03 06:53:55.019 [rank:4] [train], epoch: 3/50, iter: 100/834, loss: 0.50251, lr: 0.934980, top1: 0.30927, throughput: 311.94 | 2022-04-03 06:53:55.021 [rank:5] [train], epoch: 3/50, iter: 100/834, loss: 0.50220, lr: 0.934980, top1: 0.31286, throughput: 311.93 | 2022-04-03 06:53:55.022 [rank:1] [train], epoch: 3/50, iter: 100/834, loss: 0.50217, lr: 0.934980, top1: 0.30823, throughput: 311.65 | 2022-04-03 06:53:55.074 [rank:0] [train], epoch: 3/50, iter: 200/834, loss: 0.49611, lr: 0.970913, top1: 0.31682, throughput: 313.60 | 2022-04-03 06:54:56.244 [rank:5] [train], epoch: 3/50, iter: 200/834, loss: 0.49942, lr: 0.970913, top1: 0.31036, throughput: 313.52 | 2022-04-03 06:54:56.262 [rank:2] [train], epoch: 3/50, iter: 200/834, loss: 0.49771, lr: 0.970913, top1: 0.31823, throughput: 313.28 | 2022-04-03 06:54:56.283 [rank:7] [train], epoch: 3/50, iter: 200/834, loss: 0.49806, lr: 0.970913, top1: 0.31411, throughput: 313.16 | 2022-04-03 06:54:56.285 [rank:3] [train], epoch: 3/50, iter: 200/834, loss: 0.49549, lr: 0.970913, top1: 0.32297, throughput: 313.32 | 2022-04-03 06:54:56.287 [rank:6] [train], epoch: 3/50, iter: 200/834, loss: 0.49290, lr: 0.970913, top1: 0.32130, throughput: 313.31 | 2022-04-03 06:54:56.301 [rank:4] [train], epoch: 3/50, iter: 200/834, loss: 0.49853, lr: 0.970913, top1: 0.31214, throughput: 313.30 | 2022-04-03 06:54:56.305 [rank:1] [train], epoch: 3/50, iter: 200/834, loss: 0.49372, lr: 0.970913, top1: 0.32052, throughput: 313.43 | 2022-04-03 06:54:56.331 [rank:1] [train], epoch: 3/50, iter: 300/834, loss: 0.49085, lr: 1.006846, top1: 0.32620, throughput: 311.21 | 2022-04-03 06:55:58.025 [rank:7] [train], epoch: 3/50, iter: 300/834, loss: 0.49410, lr: 1.006846, top1: 0.31755, throughput: 310.67 | 2022-04-03 06:55:58.087 [rank:6] [train], epoch: 3/50, iter: 300/834, loss: 0.49253, lr: 1.006846, top1: 0.32000, throughput: 310.74 | 2022-04-03 06:55:58.089 [rank:4] [train], epoch: 3/50, iter: 300/834, loss: 0.49060, lr: 1.006846, top1: 0.32750, throughput: 310.66 | 2022-04-03 06:55:58.109 [rank:3] [train], epoch: 3/50, iter: 300/834, loss: 0.49033, lr: 1.006846, top1: 0.33151, throughput: 310.53 | 2022-04-03 06:55:58.116 [rank:5] [train], epoch: 3/50, iter: 300/834, loss: 0.49399, lr: 1.006846, top1: 0.32115, throughput: 310.41 | 2022-04-03 06:55:58.116 [rank:0] [train], epoch: 3/50, iter: 300/834, loss: 0.49400, lr: 1.006846, top1: 0.32724, throughput: 310.31 | 2022-04-03 06:55:58.118 [rank:2] [train], epoch: 3/50, iter: 300/834, loss: 0.49004, lr: 1.006846, top1: 0.32974, throughput: 310.36 | 2022-04-03 06:55:58.147 [rank:1] [train], epoch: 3/50, iter: 400/834, loss: 0.48381, lr: 1.042779, top1: 0.33906, throughput: 311.50 | 2022-04-03 06:56:59.662 [rank:2] [train], epoch: 3/50, iter: 400/834, loss: 0.49050, lr: 1.042779, top1: 0.32708, throughput: 312.02 | 2022-04-03 06:56:59.682 [rank:0] [train], epoch: 3/50, iter: 400/834, loss: 0.48524, lr: 1.042779, top1: 0.33161, throughput: 311.83 | 2022-04-03 06:56:59.689 [rank:6] [train], epoch: 3/50, iter: 400/834, loss: 0.48710, lr: 1.042779, top1: 0.33510, throughput: 311.65 | 2022-04-03 06:56:59.696 [rank:5] [train], epoch: 3/50, iter: 400/834, loss: 0.48550, lr: 1.042779, top1: 0.33328, throughput: 311.78 | 2022-04-03 06:56:59.698 [rank:3] [train], epoch: 3/50, iter: 400/834, loss: 0.48550, lr: 1.042779, top1: 0.33500, throughput: 311.71 | 2022-04-03 06:56:59.712 [rank:4] [train], epoch: 3/50, iter: 400/834, loss: 0.48509, lr: 1.042779, top1: 0.33583, throughput: 311.59 | 2022-04-03 06:56:59.729 [rank:7] [train], epoch: 3/50, iter: 400/834, loss: 0.48476, lr: 1.042779, top1: 0.33594, throughput: 311.41 | 2022-04-03 06:56:59.742 [rank:0] [train], epoch: 3/50, iter: 500/834, loss: 0.48291, lr: 1.078712, top1: 0.34547, throughput: 313.60 | 2022-04-03 06:58:00.913 [rank:2] [train], epoch: 3/50, iter: 500/834, loss: 0.48038, lr: 1.078712, top1: 0.34104, throughput: 313.53 | 2022-04-03 06:58:00.920 [rank:5] [train], epoch: 3/50, iter: 500/834, loss: 0.48023, lr: 1.078712, top1: 0.34099, throughput: 313.55 | 2022-04-03 06:58:00.933 [rank:1] [train], epoch: 3/50, iter: 500/834, loss: 0.48025, lr: 1.078712, top1: 0.34365, throughput: 313.31 | 2022-04-03 06:58:00.943 [rank:7] [train], epoch: 3/50, iter: 500/834, loss: 0.48156, lr: 1.078712, top1: 0.33995, throughput: 313.57 | 2022-04-03 06:58:00.972 [rank:4] [train], epoch: 3/50, iter: 500/834, loss: 0.47958, lr: 1.078712, top1: 0.34771, throughput: 313.50 | 2022-04-03 06:58:00.973 [rank:6] [train], epoch: 3/50, iter: 500/834, loss: 0.48272, lr: 1.078712, top1: 0.33839, throughput: 313.30 | 2022-04-03 06:58:00.979 [rank:3] [train], epoch: 3/50, iter: 500/834, loss: 0.48160, lr: 1.078712, top1: 0.34198, throughput: 313.33 | 2022-04-03 06:58:00.988 [rank:5] [train], epoch: 3/50, iter: 600/834, loss: 0.47707, lr: 1.114646, top1: 0.34865, throughput: 312.65 | 2022-04-03 06:59:02.344 [rank:0] [train], epoch: 3/50, iter: 600/834, loss: 0.47468, lr: 1.114646, top1: 0.35214, throughput: 312.36 | 2022-04-03 06:59:02.381 [rank:3] [train], epoch: 3/50, iter: 600/834, loss: 0.47969, lr: 1.114646, top1: 0.34276, throughput: 312.72[rank:6] [train], epoch: 3/50, iter: 600/834, loss: 0.47561, lr: 1.114646, top1: 0.35125, throughput: 312.67 | 2022-04-03 06:59:02.385| 2022-04-03 06:59:02.385 [rank:4] [train], epoch: 3/50, iter: 600/834, loss: 0.47805, lr: 1.114646, top1: 0.34578, throughput: 312.59 | 2022-04-03 06:59:02.395 [rank:2] [train], epoch: 3/50, iter: 600/834, loss: 0.47497, lr: 1.114646, top1: 0.35099, throughput: 312.22 | 2022-04-03 06:59:02.414 [rank:1] [train], epoch: 3/50, iter: 600/834, loss: 0.47431, lr: 1.114646, top1: 0.35276, throughput: 312.28 | 2022-04-03 06:59:02.425 [rank:7] [train], epoch: 3/50, iter: 600/834, loss: 0.47390, lr: 1.114646, top1: 0.35630, throughput: 312.32 | 2022-04-03 06:59:02.446 [rank:4] [train], epoch: 3/50, iter: 700/834, loss: 0.47445, lr: 1.150579, top1: 0.35198, throughput: 313.31 | 2022-04-03 07:00:03.677 [rank:0] [train], epoch: 3/50, iter: 700/834, loss: 0.47370, lr: 1.150579, top1: 0.35349, throughput: 313.23 | 2022-04-03 07:00:03.678 [rank:1] [train], epoch: 3/50, iter: 700/834, loss: 0.47027, lr: 1.150579, top1: 0.35948, throughput: 313.37 | 2022-04-03 07:00:03.695 [rank:5] [train], epoch: 3/50, iter: 700/834, loss: 0.47098, lr: 1.150579, top1: 0.35786, throughput: 312.94 | 2022-04-03 07:00:03.697 [rank:6] [train], epoch: 3/50, iter: 700/834, loss: 0.47196, lr: 1.150579, top1: 0.36078, throughput: 313.04 | 2022-04-03 07:00:03.719 [rank:7] [train], epoch: 3/50, iter: 700/834, loss: 0.47198, lr: 1.150579, top1: 0.35661, throughput: 313.30 | 2022-04-03 07:00:03.730 [rank:2] [train], epoch: 3/50, iter: 700/834, loss: 0.47152, lr: 1.150579, top1: 0.35682, throughput: 313.07 | 2022-04-03 07:00:03.742 [rank:3] [train], epoch: 3/50, iter: 700/834, loss: 0.47117, lr: 1.150579, top1: 0.35568, throughput: 313.35 | 2022-04-03 07:00:03.658 [rank:1] [train], epoch: 3/50, iter: 800/834, loss: 0.46672, lr: 1.186512, top1: 0.36437, throughput: 312.49 | 2022-04-03 07:01:05.136 [rank:3] [train], epoch: 3/50, iter: 800/834, loss: 0.46846, lr: 1.186512, top1: 0.36125, throughput: 312.25 | 2022-04-03 07:01:05.148 [rank:7] [train], epoch: 3/50, iter: 800/834, loss: 0.46880, lr: 1.186512, top1: 0.36120, throughput: 312.54 | 2022-04-03 07:01:05.162 [rank:4] [train], epoch: 3/50, iter: 800/834, loss: 0.46898, lr: 1.186512, top1: 0.36099, throughput: 312.12 | 2022-04-03 07:01:05.193 [rank:0] [train], epoch: 3/50, iter: 800/834, loss: 0.46788, lr: 1.186512, top1: 0.36188, throughput: 312.12 | 2022-04-03 07:01:05.193 [rank:6] [train], epoch: 3/50, iter: 800/834, loss: 0.46703, lr: 1.186512, top1: 0.36333, throughput: 312.74 | 2022-04-03 07:01:05.111 [rank:2] [train], epoch: 3/50, iter: 800/834, loss: 0.46958, lr: 1.186512, top1: 0.36740, throughput: 312.86 | 2022-04-03 07:01:05.111 [rank:5] [train], epoch: 3/50, iter: 800/834, loss: 0.46554, lr: 1.186512, top1: 0.36797, throughput: 312.57 | 2022-04-03 07:01:05.122 [rank:7] [train], epoch: 3/50, iter: 834/834, loss: 0.46296, lr: 1.198729, top1: 0.37086, throughput: 314.76 | 2022-04-03 07:01:25.902 [rank:1] [train], epoch: 3/50, iter: 834/834, loss: 0.46564, lr: 1.198729, top1: 0.36259, throughput: 314.27 | 2022-04-03 07:01:25.908 [rank:6] [train], epoch: 3/50, iter: 834/834, loss: 0.46595, lr: 1.198729, top1: 0.36979, throughput: 313.90 | 2022-04-03 07:01:25.908 [rank:3] [train], epoch: 3/50, iter: 834/834, loss: 0.46409, lr: 1.198729, top1: 0.36382, throughput: 314.22 | 2022-04-03 07:01:25.923 [rank:2] [train], epoch: 3/50, iter: 834/834, loss: 0.46218, lr: 1.198729, top1: 0.37469, throughput: 313.36 | 2022-04-03 07:01:25.943 [rank:0] [train], epoch: 3/50, iter: 834/834, loss: 0.45959, lr: 1.198729, top1: 0.37607, throughput: 314.48 | 2022-04-03 07:01:25.951 [rank:5] [train], epoch: 3/50, iter: 834/834, loss: 0.46187, lr: 1.198729, top1: 0.37301, throughput: 313.33 | 2022-04-03 07:01:25.956 [rank:4] [train], epoch: 3/50, iter: 834/834, loss: 0.46193, lr: 1.198729, top1: 0.37623, throughput: 313.94 | 2022-04-03 07:01:25.986 [rank:0] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35376, throughput: 483.51 | 2022-04-03 07:01:38.878 [rank:5] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.33200, throughput: 483.51 | 2022-04-03 07:01:38.883 [rank:6] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.34064, throughput: 481.66 | 2022-04-03 07:01:38.884 [rank:2] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35472, throughput: 482.89 | 2022-04-03 07:01:38.886 [rank:1] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.34704, throughput: 481.48 | 2022-04-03 07:01:38.889 [rank:7] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.34928, throughput: 481.21 | 2022-04-03 07:01:38.890 [rank:4] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.34112, throughput: 484.33 | 2022-04-03 07:01:38.891 [rank:3] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35072, throughput: 480.34 | 2022-04-03 07:01:38.935 [rank:3] [train], epoch: 4/50, iter: 100/834, loss: 0.45308, lr: 1.234662, top1: 0.38714, throughput: 313.88 | 2022-04-03 07:02:40.104 [rank:0] [train], epoch: 4/50, iter: 100/834, loss: 0.45930, lr: 1.234662, top1: 0.38281, throughput: 313.50 | 2022-04-03 07:02:40.122 [rank:4] [train], epoch: 4/50, iter: 100/834, loss: 0.46005, lr: 1.234662, top1: 0.37406, throughput: 313.46 | 2022-04-03 07:02:40.142 [rank:2] [train], epoch: 4/50, iter: 100/834, loss: 0.45494, lr: 1.234662, top1: 0.38620, throughput: 313.41 | 2022-04-03 07:02:40.147 [rank:5] [train], epoch: 4/50, iter: 100/834, loss: 0.45473, lr: 1.234662, top1: 0.38391, throughput: 313.31 | 2022-04-03 07:02:40.165 [rank:1] [train], epoch: 4/50, iter: 100/834, loss: 0.45729, lr: 1.234662, top1: 0.38068, throughput: 313.31 | 2022-04-03 07:02:40.169 [rank:6] [train], epoch: 4/50, iter: 100/834, loss: 0.46187, lr: 1.234662, top1: 0.37396, throughput: 313.19 | 2022-04-03 07:02:40.188 [rank:7] [train], epoch: 4/50, iter: 100/834, loss: 0.45920, lr: 1.234662, top1: 0.37536, throughput: 313.67 | 2022-04-03 07:02:40.100 [rank:2] [train], epoch: 4/50, iter: 200/834, loss: 0.45427, lr: 1.270595, top1: 0.38198, throughput: 313.10 | 2022-04-03 07:03:41.469 [rank:1] [train], epoch: 4/50, iter: 200/834, loss: 0.45585, lr: 1.270595, top1: 0.38016, throughput: 313.18 | 2022-04-03 07:03:41.476 [rank:4] [train], epoch: 4/50, iter: 200/834, loss: 0.45591, lr: 1.270595, top1: 0.38151, throughput: 313.01 | 2022-04-03 07:03:41.481 [rank:7] [train], epoch: 4/50, iter: 200/834, loss: 0.45465, lr: 1.270595, top1: 0.38328, throughput: 312.74 | 2022-04-03 07:03:41.493 [rank:5] [train], epoch: 4/50, iter: 200/834, loss: 0.45666, lr: 1.270595, top1: 0.37458, throughput: 313.04 | 2022-04-03 07:03:41.499 [rank:6] [train], epoch: 4/50, iter: 200/834, loss: 0.45784, lr: 1.270595, top1: 0.37818, throughput: 313.05 | 2022-04-03 07:03:41.519 [rank:0] [train], epoch: 4/50, iter: 200/834, loss: 0.45625, lr: 1.270595, top1: 0.37938, throughput: 312.60 | 2022-04-03 07:03:41.542 [rank:3] [train], epoch: 4/50, iter: 200/834, loss: 0.45604, lr: 1.270595, top1: 0.38073, throughput: 312.37 | 2022-04-03 07:03:41.570 [rank:6] [train], epoch: 4/50, iter: 300/834, loss: 0.45175, lr: 1.306529, top1: 0.38531, throughput: 312.69 | 2022-04-03 07:04:42.922 [rank:7] [train], epoch: 4/50, iter: 300/834, loss: 0.45123, lr: 1.306529, top1: 0.39333, throughput: 312.47 | 2022-04-03 07:04:42.939 [rank:1] [train], epoch: 4/50, iter: 300/834, loss: 0.44857, lr: 1.306529, top1: 0.39484, throughput: 312.28 | 2022-04-03 07:04:42.960 [rank:0] [train], epoch: 4/50, iter: 300/834, loss: 0.45051, lr: 1.306529, top1: 0.39271, throughput: 312.59 | 2022-04-03 07:04:42.965 [rank:2] [train], epoch: 4/50, iter: 300/834, loss: 0.45119, lr: 1.306529, top1: 0.38807, throughput: 312.21 | 2022-04-03 07:04:42.966 [rank:4] [train], epoch: 4/50, iter: 300/834, loss: 0.44984, lr: 1.306529, top1: 0.38760, throughput: 312.27 | 2022-04-03 07:04:42.967 [rank:5] [train], epoch: 4/50, iter: 300/834, loss: 0.44865, lr: 1.306529, top1: 0.39375, throughput: 312.20 | 2022-04-03 07:04:42.998 [rank:3] [train], epoch: 4/50, iter: 300/834, loss: 0.45028, lr: 1.306529, top1: 0.39089, throughput: 312.56 | 2022-04-03 07:04:42.998 [rank:7] [train], epoch: 4/50, iter: 400/834, loss: 0.44786, lr: 1.342462, top1: 0.39417, throughput: 312.14 | 2022-04-03 07:05:44.450 [rank:3] [train], epoch: 4/50, iter: 400/834, loss: 0.44781, lr: 1.342462, top1: 0.39354, throughput: 312.27 | 2022-04-03 07:05:44.482 [rank:5] [train], epoch: 4/50, iter: 400/834, loss: 0.44840, lr: 1.342462, top1: 0.39458, throughput: 312.24 | 2022-04-03 07:05:44.489 [rank:0] [train], epoch: 4/50, iter: 400/834, loss: 0.45332, lr: 1.342462, top1: 0.38615, throughput: 312.06 | 2022-04-03 07:05:44.492 [rank:2] [train], epoch: 4/50, iter: 400/834, loss: 0.45081, lr: 1.342462, top1: 0.39104, throughput: 312.05 | 2022-04-03 07:05:44.494 [rank:6] [train], epoch: 4/50, iter: 400/834, loss: 0.44822, lr: 1.342462, top1: 0.39656, throughput: 311.79 | 2022-04-03 07:05:44.501 [rank:1] [train], epoch: 4/50, iter: 400/834, loss: 0.44909, lr: 1.342462, top1: 0.39599, throughput: 311.86 | 2022-04-03 07:05:44.526 [rank:4] [train], epoch: 4/50, iter: 400/834, loss: 0.45025, lr: 1.342462, top1: 0.38891, throughput: 311.80 | 2022-04-03 07:05:44.545 [rank:0] [train], epoch: 4/50, iter: 500/834, loss: 0.44507, lr: 1.378395, top1: 0.39760, throughput: 312.71 | 2022-04-03 07:06:45.890 [rank:2] [train], epoch: 4/50, iter: 500/834, loss: 0.44503, lr: 1.378395, top1: 0.40130, throughput: 312.71 | 2022-04-03 07:06:45.892 [rank:5] [train], epoch: 4/50, iter: 500/834, loss: 0.44358, lr: 1.378395, top1: 0.40161, throughput: 312.21 | 2022-04-03 07:06:45.986 [rank:7] [train], epoch: 4/50, iter: 500/834, loss: 0.44572, lr: 1.378395, top1: 0.39839, throughput: 312.00 | 2022-04-03 07:06:45.988 [rank:6] [train], epoch: 4/50, iter: 500/834, loss: 0.44536, lr: 1.378395, top1: 0.39437, throughput: 312.23 | 2022-04-03 07:06:45.994 [rank:3] [train], epoch: 4/50, iter: 500/834, loss: 0.44308, lr: 1.378395, top1: 0.40292, throughput: 312.08 | 2022-04-03 07:06:46.005 [rank:1] [train], epoch: 4/50, iter: 500/834, loss: 0.44555, lr: 1.378395, top1: 0.39260, throughput: 312.14 | 2022-04-03 07:06:46.037 [rank:4] [train], epoch: 4/50, iter: 500/834, loss: 0.44470, lr: 1.378395, top1: 0.40078, throughput: 312.18 | 2022-04-03 07:06:46.047 [rank:0] [train], epoch: 4/50, iter: 600/834, loss: 0.44432, lr: 1.414328, top1: 0.39823, throughput: 312.11 | 2022-04-03 07:07:47.406 [rank:7] [train], epoch: 4/50, iter: 600/834, loss: 0.44330, lr: 1.414328, top1: 0.39932, throughput: 312.42 | 2022-04-03 07:07:47.443 [rank:4] [train], epoch: 4/50, iter: 600/834, loss: 0.44275, lr: 1.414328, top1: 0.40021, throughput: 312.61 | 2022-04-03 07:07:47.466 [rank:2] [train], epoch: 4/50, iter: 600/834, loss: 0.44566, lr: 1.414328, top1: 0.39953, throughput: 311.80 | 2022-04-03 07:07:47.470 [rank:5] [train], epoch: 4/50, iter: 600/834, loss: 0.44472, lr: 1.414328, top1: 0.39599, throughput: 312.24 | 2022-04-03 07:07:47.478 [rank:6] [train], epoch: 4/50, iter: 600/834, loss: 0.44216, lr: 1.414328, top1: 0.40401, throughput: 312.26 | 2022-04-03 07:07:47.482 [rank:3] [train], epoch: 4/50, iter: 600/834, loss: 0.43985, lr: 1.414328, top1: 0.40594, throughput: 312.22 | 2022-04-03 07:07:47.500 [rank:1] [train], epoch: 4/50, iter: 600/834, loss: 0.43865, lr: 1.414328, top1: 0.40917, throughput: 312.37 | 2022-04-03 07:07:47.503 [rank:5] [train], epoch: 4/50, iter: 700/834, loss: 0.43972, lr: 1.450261, top1: 0.40396, throughput: 311.40 | 2022-04-03 07:08:49.135 [rank:7] [train], epoch: 4/50, iter: 700/834, loss: 0.44217, lr: 1.450261, top1: 0.39974, throughput: 311.07 | 2022-04-03 07:08:49.166 [rank:4] [train], epoch: 4/50, iter: 700/834, loss: 0.44150, lr: 1.450261, top1: 0.39964, throughput: 311.14 | 2022-04-03 07:08:49.175 [rank:2] [train], epoch: 4/50, iter: 700/834, loss: 0.43772, lr: 1.450261, top1: 0.40974, throughput: 311.14 | 2022-04-03 07:08:49.179 [rank:0] [train], epoch: 4/50, iter: 700/834, loss: 0.43896, lr: 1.450261, top1: 0.40781, throughput: 310.70 | 2022-04-03 07:08:49.202 [rank:6] [train], epoch: 4/50, iter: 700/834, loss: 0.44423, lr: 1.450261, top1: 0.40057, throughput: 311.04 | 2022-04-03 07:08:49.211 [rank:3] [train], epoch: 4/50, iter: 700/834, loss: 0.43964, lr: 1.450261, top1: 0.40531, throughput: 311.08 | 2022-04-03 07:08:49.221 [rank:1] [train], epoch: 4/50, iter: 700/834, loss: 0.44295, lr: 1.450261, top1: 0.40083, throughput: 311.08 | 2022-04-03 07:08:49.224 [rank:7] [train], epoch: 4/50, iter: 800/834, loss: 0.43804, lr: 1.486194, top1: 0.40745, throughput: 313.81 | 2022-04-03 07:09:50.349 [rank:2] [train], epoch: 4/50, iter: 800/834, loss: 0.43697, lr: 1.486194, top1: 0.41167, throughput: 313.87 | 2022-04-03 07:09:50.350 [rank:6] [train], epoch: 4/50, iter: 800/834, loss: 0.43739, lr: 1.486194, top1: 0.40755, throughput: 313.94 | 2022-04-03 07:09:50.369 [rank:1] [train], epoch: 4/50, iter: 800/834, loss: 0.43909, lr: 1.486194, top1: 0.40656, throughput: 313.95 | 2022-04-03 07:09:50.380 [rank:5] [train], epoch: 4/50, iter: 800/834, loss: 0.43574, lr: 1.486194, top1: 0.41458, throughput: 313.46 | 2022-04-03 07:09:50.386 [rank:0] [train], epoch: 4/50, iter: 800/834, loss: 0.43874, lr: 1.486194, top1: 0.40510, throughput: 313.75 | 2022-04-03 07:09:50.398 [rank:4] [train], epoch: 4/50, iter: 800/834, loss: 0.43612, lr: 1.486194, top1: 0.41281, throughput: 313.48 | 2022-04-03 07:09:50.422 [rank:3] [train], epoch: 4/50, iter: 800/834, loss: 0.43943, lr: 1.486194, top1: 0.40406, throughput: 313.65 | 2022-04-03 07:09:50.435 [rank:1] [train], epoch: 4/50, iter: 834/834, loss: 0.43529, lr: 1.498411, top1: 0.40916, throughput: 312.90 | 2022-04-03 07:10:11.243 [rank:7] [train], epoch: 4/50, iter: 834/834, loss: 0.43627, lr: 1.498411, top1: 0.40717, throughput: 312.34 | 2022-04-03 07:10:11.250 [rank:6] [train], epoch: 4/50, iter: 834/834, loss: 0.43400, lr: 1.498411, top1: 0.41268, throughput: 312.62 | 2022-04-03 07:10:11.251 [rank:5] [train], epoch: 4/50, iter: 834/834, loss: 0.43990, lr: 1.498411, top1: 0.40518, throughput: 312.86 | 2022-04-03 07:10:11.252 [rank:4] [train], epoch: 4/50, iter: 834/834, loss: 0.43478, lr: 1.498411, top1: 0.41115, throughput: 313.40 | 2022-04-03 07:10:11.252 [rank:3] [train], epoch: 4/50, iter: 834/834, loss: 0.43978, lr: 1.498411, top1: 0.41161, throughput: 313.55 | 2022-04-03 07:10:11.255 [rank:0] [train], epoch: 4/50, iter: 834/834, loss: 0.43672, lr: 1.498411, top1: 0.41422, throughput: 312.41 | 2022-04-03 07:10:11.294 [rank:2] [train], epoch: 4/50, iter: 834/834, loss: 0.43585, lr: 1.498411, top1: 0.40456, throughput: 311.56 | 2022-04-03 07:10:11.302 [rank:0] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37568, throughput: 486.38 | 2022-04-03 07:10:24.144 [rank:2] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37712, throughput: 486.46 | 2022-04-03 07:10:24.150 [rank:7] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37680, throughput: 484.38 | 2022-04-03 07:10:24.153 [rank:4] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.36464, throughput: 484.37 | 2022-04-03 07:10:24.155 [rank:6] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.36832, throughput: 484.20 | 2022-04-03 07:10:24.159 [rank:5] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.35136, throughput: 483.94 | 2022-04-03 07:10:24.167 [rank:1] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37408, throughput: 483.57 | 2022-04-03 07:10:24.168 [rank:3] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.36352, throughput: 482.81 | 2022-04-03 07:10:24.200 [rank:1] [train], epoch: 5/50, iter: 100/834, loss: 0.42825, lr: 1.496603, top1: 0.42552, throughput: 312.04 | 2022-04-03 07:11:25.699 [rank:0] [train], epoch: 5/50, iter: 100/834, loss: 0.42974, lr: 1.496603, top1: 0.41969, throughput: 311.84 | 2022-04-03 07:11:25.713 [rank:3] [train], epoch: 5/50, iter: 100/834, loss: 0.43090, lr: 1.496603, top1: 0.42344, throughput: 312.03 | 2022-04-03 07:11:25.733 [rank:5] [train], epoch: 5/50, iter: 100/834, loss: 0.42805, lr: 1.496603, top1: 0.42010, throughput: 311.83 | 2022-04-03 07:11:25.740 [rank:7] [train], epoch: 5/50, iter: 100/834, loss: 0.42827, lr: 1.496603, top1: 0.42651, throughput: 311.72 | 2022-04-03 07:11:25.747 [rank:2] [train], epoch: 5/50, iter: 100/834, loss: 0.43068, lr: 1.496603, top1: 0.41943, throughput: 311.66 | 2022-04-03 07:11:25.756 [rank:4] [train], epoch: 5/50, iter: 100/834, loss: 0.43256, lr: 1.496603, top1: 0.41797, throughput: 311.58 | 2022-04-03 07:11:25.777 [rank:6] [train], epoch: 5/50, iter: 100/834, loss: 0.42914, lr: 1.496603, top1: 0.42365, throughput: 312.04 | 2022-04-03 07:11:25.689 [rank:3] [train], epoch: 5/50, iter: 200/834, loss: 0.42531, lr: 1.494753, top1: 0.42891, throughput: 311.22 | 2022-04-03 07:12:27.426 [rank:7] [train], epoch: 5/50, iter: 200/834, loss: 0.43000, lr: 1.494753, top1: 0.42182, throughput: 311.14 | 2022-04-03 07:12:27.455 [rank:1] [train], epoch: 5/50, iter: 200/834, loss: 0.43003, lr: 1.494753, top1: 0.42125, throughput: 310.90 | 2022-04-03 07:12:27.455 [rank:4] [train], epoch: 5/50, iter: 200/834, loss: 0.42605, lr: 1.494753, top1: 0.43021, throughput: 311.27 | 2022-04-03 07:12:27.460 [rank:0] [train], epoch: 5/50, iter: 200/834, loss: 0.42612, lr: 1.494753, top1: 0.42599, throughput: 310.72 | 2022-04-03 07:12:27.506 [rank:6] [train], epoch: 5/50, iter: 200/834, loss: 0.42740, lr: 1.494753, top1: 0.42906, throughput: 310.59 | 2022-04-03 07:12:27.506 [rank:5] [train], epoch: 5/50, iter: 200/834, loss: 0.42796, lr: 1.494753, top1: 0.42906, throughput: 310.80 | 2022-04-03 07:12:27.515 [rank:2] [train], epoch: 5/50, iter: 200/834, loss: 0.42941, lr: 1.494753, top1: 0.42083, throughput: 310.84 | 2022-04-03 07:12:27.524 [rank:3] [train], epoch: 5/50, iter: 300/834, loss: 0.42532, lr: 1.492861, top1: 0.42964, throughput: 312.98 | 2022-04-03 07:13:28.771 [rank:1] [train], epoch: 5/50, iter: 300/834, loss: 0.42576, lr: 1.492861, top1: 0.42875, throughput: 313.02 | 2022-04-03 07:13:28.793 [rank:4] [train], epoch: 5/50, iter: 300/834, loss: 0.42231, lr: 1.492861, top1: 0.43583, throughput: 313.04 | 2022-04-03 07:13:28.794 [rank:7] [train], epoch: 5/50, iter: 300/834, loss: 0.42529, lr: 1.492861, top1: 0.42594, throughput: 313.01 | 2022-04-03 07:13:28.794 [rank:6] [train], epoch: 5/50, iter: 300/834, loss: 0.42519, lr: 1.492861, top1: 0.42776, throughput: 313.24 | 2022-04-03 07:13:28.800 [rank:0] [train], epoch: 5/50, iter: 300/834, loss: 0.42741, lr: 1.492861, top1: 0.42380, throughput: 313.18 | 2022-04-03 07:13:28.812 [rank:2] [train], epoch: 5/50, iter: 300/834, loss: 0.42735, lr: 1.492861, top1: 0.42578, throughput: 313.27 | 2022-04-03 07:13:28.812 [rank:5] [train], epoch: 5/50, iter: 300/834, loss: 0.42471, lr: 1.492861, top1: 0.42818, throughput: 313.21 | 2022-04-03 07:13:28.815 [rank:1] [train], epoch: 5/50, iter: 400/834, loss: 0.42111, lr: 1.490929, top1: 0.43839, throughput: 312.46 | 2022-04-03 07:14:30.241 [rank:4] [train], epoch: 5/50, iter: 400/834, loss: 0.42222, lr: 1.490929, top1: 0.42948, throughput: 312.44 | 2022-04-03 07:14:30.245 [rank:7] [train], epoch: 5/50, iter: 400/834, loss: 0.42146, lr: 1.490929, top1: 0.43823, throughput: 312.41 | 2022-04-03 07:14:30.252 [rank:6] [train], epoch: 5/50, iter: 400/834, loss: 0.42290, lr: 1.490929, top1: 0.43146, throughput: 312.39 | 2022-04-03 07:14:30.262 [rank:2] [train], epoch: 5/50, iter: 400/834, loss: 0.41981, lr: 1.490929, top1: 0.43203, throughput: 312.36 | 2022-04-03 07:14:30.280 [rank:3] [train], epoch: 5/50, iter: 400/834, loss: 0.42146, lr: 1.490929, top1: 0.43339, throughput: 312.15 | 2022-04-03 07:14:30.280 [rank:0] [train], epoch: 5/50, iter: 400/834, loss: 0.42075, lr: 1.490929, top1: 0.43339, throughput: 312.32 | 2022-04-03 07:14:30.286 [rank:5] [train], epoch: 5/50, iter: 400/834, loss: 0.42243, lr: 1.490929, top1: 0.43083, throughput: 312.15 | 2022-04-03 07:14:30.323 [rank:0] [train], epoch: 5/50, iter: 500/834, loss: 0.41792, lr: 1.488956, top1: 0.44240, throughput: 312.92 | 2022-04-03 07:15:31.643 [rank:3] [train], epoch: 5/50, iter: 500/834, loss: 0.41931, lr: 1.488956, top1: 0.44021, throughput: 312.82 | 2022-04-03 07:15:31.657 [rank:6] [train], epoch: 5/50, iter: 500/834, loss: 0.42021, lr: 1.488956, top1: 0.43802, throughput: 312.65 | 2022-04-03 07:15:31.673 [rank:5] [train], epoch: 5/50, iter: 500/834, loss: 0.41897, lr: 1.488956, top1: 0.44510, throughput: 312.86 | 2022-04-03 07:15:31.692 [rank:2] [train], epoch: 5/50, iter: 500/834, loss: 0.41872, lr: 1.488956, top1: 0.43667, throughput: 312.62 | 2022-04-03 07:15:31.696 [rank:1] [train], epoch: 5/50, iter: 500/834, loss: 0.41901, lr: 1.488956, top1: 0.43917, throughput: 312.38 | 2022-04-03 07:15:31.704 [rank:7] [train], epoch: 5/50, iter: 500/834, loss: 0.41659, lr: 1.488956, top1: 0.44630, throughput: 312.38 | 2022-04-03 07:15:31.716 [rank:4] [train], epoch: 5/50, iter: 500/834, loss: 0.41909, lr: 1.488956, top1: 0.43464, throughput: 312.26 | 2022-04-03 07:15:31.732 [rank:6] [train], epoch: 5/50, iter: 600/834, loss: 0.41654, lr: 1.486941, top1: 0.43885, throughput: 311.74 | 2022-04-03 07:16:33.263 [rank:0] [train], epoch: 5/50, iter: 600/834, loss: 0.41748, lr: 1.486941, top1: 0.44266, throughput: 311.56 | 2022-04-03 07:16:33.268 [rank:1] [train], epoch: 5/50, iter: 600/834, loss: 0.41685, lr: 1.486941, top1: 0.44365, throughput: 311.78 | 2022-04-03 07:16:33.285 [rank:5] [train], epoch: 5/50, iter: 600/834, loss: 0.41557, lr: 1.486941, top1: 0.44630, throughput: 311.69 | 2022-04-03 07:16:33.292 [rank:7] [train], epoch: 5/50, iter: 600/834, loss: 0.41665, lr: 1.486941, top1: 0.44656, throughput: 311.74 | 2022-04-03 07:16:33.305 [rank:2] [train], epoch: 5/50, iter: 600/834, loss: 0.42053, lr: 1.486941, top1: 0.43578, throughput: 311.58 | 2022-04-03 07:16:33.318 [rank:3] [train], epoch: 5/50, iter: 600/834, loss: 0.41833, lr: 1.486941, top1: 0.44432, throughput: 311.37 | 2022-04-03 07:16:33.320 [rank:4] [train], epoch: 5/50, iter: 600/834, loss: 0.41948, lr: 1.486941, top1: 0.43594, throughput: 311.70 | 2022-04-03 07:16:33.329 [rank:7] [train], epoch: 5/50, iter: 700/834, loss: 0.41841, lr: 1.484886, top1: 0.43563, throughput: 312.97 | 2022-04-03 07:17:34.654 [rank:3] [train], epoch: 5/50, iter: 700/834, loss: 0.41542, lr: 1.484886, top1: 0.44536, throughput: 313.03 | 2022-04-03 07:17:34.656 [rank:5] [train], epoch: 5/50, iter: 700/834, loss: 0.41622, lr: 1.484886, top1: 0.43932, throughput: 312.87 | 2022-04-03 07:17:34.660 [rank:2] [train], epoch: 5/50, iter: 700/834, loss: 0.41539, lr: 1.484886, top1: 0.44469, throughput: 312.97 | 2022-04-03 07:17:34.666 [rank:6] [train], epoch: 5/50, iter: 700/834, loss: 0.41718, lr: 1.484886, top1: 0.44208, throughput: 312.50 | 2022-04-03 07:17:34.703 [rank:0] [train], epoch: 5/50, iter: 700/834, loss: 0.41672, lr: 1.484886, top1: 0.43708, throughput: 312.51 | 2022-04-03 07:17:34.707 [rank:4] [train], epoch: 5/50, iter: 700/834, loss: 0.41218, lr: 1.484886, top1: 0.44990, throughput: 312.82 | 2022-04-03 07:17:34.707 [rank:1] [train], epoch: 5/50, iter: 700/834, loss: 0.41455, lr: 1.484886, top1: 0.44646, throughput: 312.59 | 2022-04-03 07:17:34.707 [rank:0] [train], epoch: 5/50, iter: 800/834, loss: 0.41216, lr: 1.482790, top1: 0.44974, throughput: 312.45 | 2022-04-03 07:18:36.157 [rank:7] [train], epoch: 5/50, iter: 800/834, loss: 0.41093, lr: 1.482790, top1: 0.45495, throughput: 312.11 | 2022-04-03 07:18:36.171 [rank:5] [train], epoch: 5/50, iter: 800/834, loss: 0.41223, lr: 1.482790, top1: 0.45016, throughput: 312.04 | 2022-04-03 07:18:36.191 [rank:2] [train], epoch: 5/50, iter: 800/834, loss: 0.41339, lr: 1.482790, top1: 0.44620, throughput: 312.05 | 2022-04-03 07:18:36.194 [rank:1] [train], epoch: 5/50, iter: 800/834, loss: 0.41378, lr: 1.482790, top1: 0.45135, throughput: 312.22 | 2022-04-03 07:18:36.203 [rank:6] [train], epoch: 5/50, iter: 800/834, loss: 0.41242, lr: 1.482790, top1: 0.45094, throughput: 312.13 | 2022-04-03 07:18:36.215 [rank:3] [train], epoch: 5/50, iter: 800/834, loss: 0.41619, lr: 1.482790, top1: 0.44354, throughput: 311.73 | 2022-04-03 07:18:36.247 [rank:4] [train], epoch: 5/50, iter: 800/834, loss: 0.41489, lr: 1.482790, top1: 0.44661, throughput: 312.45 | 2022-04-03 07:18:36.156 [rank:6] [train], epoch: 5/50, iter: 834/834, loss: 0.41004, lr: 1.482068, top1: 0.45021, throughput: 310.45 | 2022-04-03 07:18:57.243 [rank:2] [train], epoch: 5/50, iter: 834/834, loss: 0.41251, lr: 1.482068, top1: 0.45006, throughput: 310.10 | 2022-04-03 07:18:57.246 [rank:4] [train], epoch: 5/50, iter: 834/834, loss: 0.41435, lr: 1.482068, top1: 0.44853, throughput: 309.49 | 2022-04-03 07:18:57.249 [rank:0] [train], epoch: 5/50, iter: 834/834, loss: 0.40948, lr: 1.482068, top1: 0.46002, throughput: 309.46 | 2022-04-03 07:18:57.252 [rank:7] [train], epoch: 5/50, iter: 834/834, loss: 0.41135, lr: 1.482068, top1: 0.45404, throughput: 309.61 | 2022-04-03 07:18:57.256 [rank:3] [train], epoch: 5/50, iter: 834/834, loss: 0.41030, lr: 1.482068, top1: 0.45496, throughput: 310.43 | 2022-04-03 07:18:57.277 [rank:1] [train], epoch: 5/50, iter: 834/834, loss: 0.40848, lr: 1.482068, top1: 0.45634, throughput: 309.76 | 2022-04-03 07:18:57.277 [rank:5] [train], epoch: 5/50, iter: 834/834, loss: 0.41195, lr: 1.482068, top1: 0.45236, throughput: 309.31 | 2022-04-03 07:18:57.296 [rank:0] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.44192, throughput: 484.09 | 2022-04-03 07:19:10.162 [rank:7] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.43328, throughput: 484.05 | 2022-04-03 07:19:10.168 [rank:1] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.43808, throughput: 484.71 | 2022-04-03 07:19:10.171 [rank:5] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.41808, throughput: 485.37 | 2022-04-03 07:19:10.173 [rank:6] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.43392, throughput: 483.37 | 2022-04-03 07:19:10.173 [rank:2] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.42544, throughput: 483.28 | 2022-04-03 07:19:10.178 [rank:4] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.42496, throughput: 483.55 | 2022-04-03 07:19:10.174 [rank:3] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.43392, throughput: 483.04 | 2022-04-03 07:19:10.215 [rank:2] [train], epoch: 6/50, iter: 100/834, loss: 0.40659, lr: 1.479918, top1: 0.46021, throughput: 312.80 | 2022-04-03 07:20:11.559 [rank:7] [train], epoch: 6/50, iter: 100/834, loss: 0.40745, lr: 1.479918, top1: 0.45760, throughput: 312.66 | 2022-04-03 07:20:11.576 [rank:1] [train], epoch: 6/50, iter: 100/834, loss: 0.40648, lr: 1.479918, top1: 0.46115, throughput: 312.60 | 2022-04-03 07:20:11.592 [rank:3] [train], epoch: 6/50, iter: 100/834, loss: 0.40228, lr: 1.479918, top1: 0.47068, throughput: 312.80 | 2022-04-03 07:20:11.596 [rank:6] [train], epoch: 6/50, iter: 100/834, loss: 0.40655, lr: 1.479918, top1: 0.46495, throughput: 312.50 | 2022-04-03 07:20:11.614 [rank:0] [train], epoch: 6/50, iter: 100/834, loss: 0.40725, lr: 1.479918, top1: 0.45911, throughput: 312.43 | 2022-04-03 07:20:11.616 [rank:4] [train], epoch: 6/50, iter: 100/834, loss: 0.40783, lr: 1.479918, top1: 0.46047, throughput: 312.43 | 2022-04-03 07:20:11.627 [rank:5] [train], epoch: 6/50, iter: 100/834, loss: 0.40469, lr: 1.479918, top1: 0.46370, throughput: 312.36 | 2022-04-03 07:20:11.641 [rank:1] [train], epoch: 6/50, iter: 200/834, loss: 0.40505, lr: 1.477728, top1: 0.46453, throughput: 313.13 | 2022-04-03 07:21:12.909 [rank:6] [train], epoch: 6/50, iter: 200/834, loss: 0.40140, lr: 1.477728, top1: 0.46604, throughput: 313.05 | 2022-04-03 07:21:12.945 [rank:2] [train], epoch: 6/50, iter: 200/834, loss: 0.40891, lr: 1.477728, top1: 0.45594, throughput: 312.70 | 2022-04-03 07:21:12.960 [rank:7] [train], epoch: 6/50, iter: 200/834, loss: 0.40554, lr: 1.477728, top1: 0.46125, throughput: 312.62 | 2022-04-03 07:21:12.992 [rank:5] [train], epoch: 6/50, iter: 200/834, loss: 0.40438, lr: 1.477728, top1: 0.46547, throughput: 312.84 | 2022-04-03 07:21:13.014 [rank:3] [train], epoch: 6/50, iter: 200/834, loss: 0.40126, lr: 1.477728, top1: 0.46714, throughput: 312.56 | 2022-04-03 07:21:13.024 [rank:0] [train], epoch: 6/50, iter: 200/834, loss: 0.40159, lr: 1.477728, top1: 0.46526, throughput: 313.03 | 2022-04-03 07:21:12.952 [rank:4] [train], epoch: 6/50, iter: 200/834, loss: 0.40717, lr: 1.477728, top1: 0.45995, throughput: 312.61 | 2022-04-03 07:21:13.046 [rank:6] [train], epoch: 6/50, iter: 300/834, loss: 0.40332, lr: 1.475497, top1: 0.46276, throughput: 312.31 | 2022-04-03 07:22:14.422 [rank:2] [train], epoch: 6/50, iter: 300/834, loss: 0.40418, lr: 1.475497, top1: 0.46568, throughput: 312.25 | 2022-04-03 07:22:14.449 [rank:7] [train], epoch: 6/50, iter: 300/834, loss: 0.40377, lr: 1.475497, top1: 0.46792, throughput: 312.25 | 2022-04-03 07:22:14.480 [rank:1] [train], epoch: 6/50, iter: 300/834, loss: 0.40731, lr: 1.475497, top1: 0.45620, throughput: 311.68 | 2022-04-03 07:22:14.511 [rank:4] [train], epoch: 6/50, iter: 300/834, loss: 0.40168, lr: 1.475497, top1: 0.46651, throughput: 312.26 | 2022-04-03 07:22:14.534 [rank:0] [train], epoch: 6/50, iter: 300/834, loss: 0.40411, lr: 1.475497, top1: 0.46464, throughput: 311.78 | 2022-04-03 07:22:14.534 [rank:5] [train], epoch: 6/50, iter: 300/834, loss: 0.40312, lr: 1.475497, top1: 0.46406, throughput: 312.07 | 2022-04-03 07:22:14.539 [rank:3] [train], epoch: 6/50, iter: 300/834, loss: 0.40890, lr: 1.475497, top1: 0.45401, throughput: 311.82 | 2022-04-03 07:22:14.598 [rank:5] [train], epoch: 6/50, iter: 400/834, loss: 0.40268, lr: 1.473226, top1: 0.47214, throughput: 313.85 | 2022-04-03 07:23:15.714 [rank:7] [train], epoch: 6/50, iter: 400/834, loss: 0.40083, lr: 1.473226, top1: 0.46880, throughput: 313.48 | 2022-04-03 07:23:15.727 [rank:2] [train], epoch: 6/50, iter: 400/834, loss: 0.40150, lr: 1.473226, top1: 0.46703, throughput: 313.19 | 2022-04-03 07:23:15.754 [rank:3] [train], epoch: 6/50, iter: 400/834, loss: 0.40115, lr: 1.473226, top1: 0.46937, throughput: 313.95 | 2022-04-03 07:23:15.754 [rank:1] [train], epoch: 6/50, iter: 400/834, loss: 0.40373, lr: 1.473226, top1: 0.46380, throughput: 313.47 | 2022-04-03 07:23:15.760 [rank:6] [train], epoch: 6/50, iter: 400/834, loss: 0.40199, lr: 1.473226, top1: 0.46568, throughput: 313.01 | 2022-04-03 07:23:15.763 [rank:0] [train], epoch: 6/50, iter: 400/834, loss: 0.40418, lr: 1.473226, top1: 0.46531, throughput: 313.50 | 2022-04-03 07:23:15.778 [rank:4] [train], epoch: 6/50, iter: 400/834, loss: 0.40597, lr: 1.473226, top1: 0.45635, throughput: 313.49 | 2022-04-03 07:23:15.780 [rank:5] [train], epoch: 6/50, iter: 500/834, loss: 0.39703, lr: 1.470915, top1: 0.47672, throughput: 312.64 | 2022-04-03 07:24:17.127 [rank:7] [train], epoch: 6/50, iter: 500/834, loss: 0.40325, lr: 1.470915, top1: 0.46505, throughput: 312.44 | 2022-04-03 07:24:17.179 [rank:1] [train], epoch: 6/50, iter: 500/834, loss: 0.40213, lr: 1.470915, top1: 0.46812, throughput: 312.56 | 2022-04-03 07:24:17.188 [rank:3] [train], epoch: 6/50, iter: 500/834, loss: 0.40140, lr: 1.470915, top1: 0.47052, throughput: 312.39 | 2022-04-03 07:24:17.215 [rank:0] [train], epoch: 6/50, iter: 500/834, loss: 0.40235, lr: 1.470915, top1: 0.46750, throughput: 312.50 | 2022-04-03 07:24:17.219 [rank:2] [train], epoch: 6/50, iter: 500/834, loss: 0.40270, lr: 1.470915, top1: 0.46651, throughput: 312.35 | 2022-04-03 07:24:17.224 [rank:6] [train], epoch: 6/50, iter: 500/834, loss: 0.40220, lr: 1.470915, top1: 0.46562, throughput: 312.37 | 2022-04-03 07:24:17.227 [rank:4] [train], epoch: 6/50, iter: 500/834, loss: 0.40303, lr: 1.470915, top1: 0.47073, throughput: 312.19 | 2022-04-03 07:24:17.281 [rank:6] [train], epoch: 6/50, iter: 600/834, loss: 0.39904, lr: 1.468564, top1: 0.47599, throughput: 312.48 | 2022-04-03 07:25:18.671 [rank:3] [train], epoch: 6/50, iter: 600/834, loss: 0.40031, lr: 1.468564, top1: 0.47016, throughput: 312.24 | 2022-04-03 07:25:18.705 [rank:7] [train], epoch: 6/50, iter: 600/834, loss: 0.40339, lr: 1.468564, top1: 0.46839, throughput: 312.01 | 2022-04-03 07:25:18.716 [rank:1] [train], epoch: 6/50, iter: 600/834, loss: 0.39881, lr: 1.468564, top1: 0.47333, throughput: 312.02 | 2022-04-03 07:25:18.722 [rank:5] [train], epoch: 6/50, iter: 600/834, loss: 0.40011, lr: 1.468564, top1: 0.47297, throughput: 311.56 | 2022-04-03 07:25:18.751 [rank:0] [train], epoch: 6/50, iter: 600/834, loss: 0.40026, lr: 1.468564, top1: 0.47068, throughput: 312.02 | 2022-04-03 07:25:18.753 [rank:4] [train], epoch: 6/50, iter: 600/834, loss: 0.39947, lr: 1.468564, top1: 0.47448, throughput: 312.10 | 2022-04-03 07:25:18.800 [rank:2] [train], epoch: 6/50, iter: 600/834, loss: 0.40080, lr: 1.468564, top1: 0.47036, throughput: 311.73 | 2022-04-03 07:25:18.816 [rank:1] [train], epoch: 6/50, iter: 700/834, loss: 0.39766, lr: 1.466173, top1: 0.47635, throughput: 312.14 | 2022-04-03 07:26:20.234 [rank:5] [train], epoch: 6/50, iter: 700/834, loss: 0.39919, lr: 1.466173, top1: 0.47349, throughput: 312.05 | 2022-04-03 07:26:20.279 [rank:7] [train], epoch: 6/50, iter: 700/834, loss: 0.39930, lr: 1.466173, top1: 0.47109, throughput: 311.85 | 2022-04-03 07:26:20.285 [rank:0] [train], epoch: 6/50, iter: 700/834, loss: 0.39818, lr: 1.466173, top1: 0.47557, throughput: 312.03 | 2022-04-03 07:26:20.286 [rank:4] [train], epoch: 6/50, iter: 700/834, loss: 0.39719, lr: 1.466173, top1: 0.47240, throughput: 312.18 | 2022-04-03 07:26:20.302 [rank:3] [train], epoch: 6/50, iter: 700/834, loss: 0.39790, lr: 1.466173, top1: 0.47255, throughput: 311.68 | 2022-04-03 07:26:20.306 [rank:2] [train], epoch: 6/50, iter: 700/834, loss: 0.39924, lr: 1.466173, top1: 0.47203, throughput: 312.04 | 2022-04-03 07:26:20.346 [rank:6] [train], epoch: 6/50, iter: 700/834, loss: 0.40170, lr: 1.466173, top1: 0.47104, throughput: 311.71 | 2022-04-03 07:26:20.266 [rank:5] [train], epoch: 6/50, iter: 800/834, loss: 0.39850, lr: 1.463742, top1: 0.47557, throughput: 313.52 | 2022-04-03 07:27:21.520 [rank:7] [train], epoch: 6/50, iter: 800/834, loss: 0.39956, lr: 1.463742, top1: 0.47375, throughput: 313.54 | 2022-04-03 07:27:21.521 [rank:0] [train], epoch: 6/50, iter: 800/834, loss: 0.39590, lr: 1.463742, top1: 0.47927, throughput: 313.35 | 2022-04-03 07:27:21.560 [rank:4] [train], epoch: 6/50, iter: 800/834, loss: 0.39566, lr: 1.463742, top1: 0.47604, throughput: 313.42 | 2022-04-03 07:27:21.561 [rank:1] [train], epoch: 6/50, iter: 800/834, loss: 0.39527, lr: 1.463742, top1: 0.48250, throughput: 312.96 | 2022-04-03 07:27:21.584 [rank:3] [train], epoch: 6/50, iter: 800/834, loss: 0.39919, lr: 1.463742, top1: 0.47339, throughput: 313.31 | 2022-04-03 07:27:21.587 [rank:6] [train], epoch: 6/50, iter: 800/834, loss: 0.39589, lr: 1.463742, top1: 0.47807, throughput: 313.11 | 2022-04-03 07:27:21.587 [rank:2] [train], epoch: 6/50, iter: 800/834, loss: 0.39536, lr: 1.463742, top1: 0.47620, throughput: 313.46 | 2022-04-03 07:27:21.598 [rank:6] [train], epoch: 6/50, iter: 834/834, loss: 0.39656, lr: 1.462907, top1: 0.47687, throughput: 312.19 | 2022-04-03 07:27:42.497 [rank:5] [train], epoch: 6/50, iter: 834/834, loss: 0.39772, lr: 1.462907, top1: 0.46875, throughput: 311.17 | 2022-04-03 07:27:42.499 [rank:2] [train], epoch: 6/50, iter: 834/834, loss: 0.40016, lr: 1.462907, top1: 0.47227, throughput: 312.32 | 2022-04-03 07:27:42.500 [rank:3] [train], epoch: 6/50, iter: 834/834, loss: 0.39611, lr: 1.462907, top1: 0.47549, throughput: 312.14 | 2022-04-03 07:27:42.500 [rank:7] [train], epoch: 6/50, iter: 834/834, loss: 0.39492, lr: 1.462907, top1: 0.48116, throughput: 311.16 | 2022-04-03 07:27:42.501 [rank:0] [train], epoch: 6/50, iter: 834/834, loss: 0.39256, lr: 1.462907, top1: 0.48545, throughput: 311.73 | 2022-04-03 07:27:42.501 [rank:1] [train], epoch: 6/50, iter: 834/834, loss: 0.39865, lr: 1.462907, top1: 0.47457, throughput: 312.07 | 2022-04-03 07:27:42.502 [rank:4] [train], epoch: 6/50, iter: 834/834, loss: 0.39781, lr: 1.462907, top1: 0.47518, throughput: 311.42 | 2022-04-03 07:27:42.523 [rank:4] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.46384, throughput: 485.77 | 2022-04-03 07:27:55.389 [rank:0] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.48112, throughput: 484.91 | 2022-04-03 07:27:55.390 [rank:1] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.48048, throughput: 484.88 | 2022-04-03 07:27:55.392 [rank:7] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.47808, throughput: 484.69 | 2022-04-03 07:27:55.395 [rank:6] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.47360, throughput: 484.45 | 2022-04-03 07:27:55.398 [rank:2] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.47744, throughput: 484.48 | 2022-04-03 07:27:55.400 [rank:5] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.45904, throughput: 484.33 | 2022-04-03 07:27:55.404 [rank:3] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.46320, throughput: 483.60 | 2022-04-03 07:27:55.424 [rank:5] [train], epoch: 7/50, iter: 100/834, loss: 0.39047, lr: 1.460424, top1: 0.49078, throughput: 312.36 | 2022-04-03 07:28:56.872 [rank:6] [train], epoch: 7/50, iter: 100/834, loss: 0.39307, lr: 1.460424, top1: 0.48286, throughput: 312.33 | 2022-04-03 07:28:56.872 [rank:7] [train], epoch: 7/50, iter: 100/834, loss: 0.39080, lr: 1.460424, top1: 0.48609, throughput: 312.31 | 2022-04-03 07:28:56.873 [rank:4] [train], epoch: 7/50, iter: 100/834, loss: 0.39037, lr: 1.460424, top1: 0.48641, throughput: 312.13 | 2022-04-03 07:28:56.902 [rank:2] [train], epoch: 7/50, iter: 100/834, loss: 0.39361, lr: 1.460424, top1: 0.48281, throughput: 312.13 | 2022-04-03 07:28:56.914 [rank:0] [train], epoch: 7/50, iter: 100/834, loss: 0.38639, lr: 1.460424, top1: 0.49672, throughput: 312.04 | 2022-04-03 07:28:56.921 [rank:3] [train], epoch: 7/50, iter: 100/834, loss: 0.39308, lr: 1.460424, top1: 0.48609, throughput: 312.12 | 2022-04-03 07:28:56.939 [rank:1] [train], epoch: 7/50, iter: 100/834, loss: 0.39268, lr: 1.460424, top1: 0.48458, throughput: 311.95 | 2022-04-03 07:28:56.940 [rank:2] [train], epoch: 7/50, iter: 200/834, loss: 0.39036, lr: 1.457901, top1: 0.48750, throughput: 311.92 | 2022-04-03 07:29:58.468 [rank:7] [train], epoch: 7/50, iter: 200/834, loss: 0.39436, lr: 1.457901, top1: 0.48052, throughput: 311.67 | 2022-04-03 07:29:58.477 [rank:6] [train], epoch: 7/50, iter: 200/834, loss: 0.39084, lr: 1.457901, top1: 0.48875, throughput: 311.53 | 2022-04-03 07:29:58.502 [rank:1] [train], epoch: 7/50, iter: 200/834, loss: 0.38870, lr: 1.457901, top1: 0.49401, throughput: 311.87 | 2022-04-03 07:29:58.503 [rank:5] [train], epoch: 7/50, iter: 200/834, loss: 0.39023, lr: 1.457901, top1: 0.48526, throughput: 311.52 | 2022-04-03 07:29:58.504 [rank:3] [train], epoch: 7/50, iter: 200/834, loss: 0.39302, lr: 1.457901, top1: 0.47984, throughput: 311.73 | 2022-04-03 07:29:58.531 [rank:0] [train], epoch: 7/50, iter: 200/834, loss: 0.38920, lr: 1.457901, top1: 0.49266, throughput: 311.60 | 2022-04-03 07:29:58.538 [rank:4] [train], epoch: 7/50, iter: 200/834, loss: 0.39149, lr: 1.457901, top1: 0.48505, throughput: 311.46 | 2022-04-03 07:29:58.547 [rank:7] [train], epoch: 7/50, iter: 300/834, loss: 0.39166, lr: 1.455340, top1: 0.48536, throughput: 313.28 | 2022-04-03 07:30:59.763 [rank:5] [train], epoch: 7/50, iter: 300/834, loss: 0.39025, lr: 1.455340, top1: 0.48505, throughput: 313.27 | 2022-04-03 07:30:59.793 [rank:2] [train], epoch: 7/50, iter: 300/834, loss: 0.39197, lr: 1.455340, top1: 0.48359, throughput: 313.08 | 2022-04-03 07:30:59.794 [rank:6] [train], epoch: 7/50, iter: 300/834, loss: 0.38907, lr: 1.455340, top1: 0.49151, throughput: 313.20 | 2022-04-03 07:30:59.805 [rank:1] [train], epoch: 7/50, iter: 300/834, loss: 0.39388, lr: 1.455340, top1: 0.47875, throughput: 313.18 | 2022-04-03 07:30:59.811 [rank:4] [train], epoch: 7/50, iter: 300/834, loss: 0.38925, lr: 1.455340, top1: 0.48620, throughput: 313.40 | 2022-04-03 07:30:59.811 [rank:3] [train], epoch: 7/50, iter: 300/834, loss: 0.38779, lr: 1.455340, top1: 0.49312, throughput: 313.28 | 2022-04-03 07:30:59.818 [rank:0] [train], epoch: 7/50, iter: 300/834, loss: 0.39108, lr: 1.455340, top1: 0.48552, throughput: 313.29 | 2022-04-03 07:30:59.822 [rank:7] [train], epoch: 7/50, iter: 400/834, loss: 0.39242, lr: 1.452739, top1: 0.48547, throughput: 313.90 | 2022-04-03 07:32:00.930 [rank:3] [train], epoch: 7/50, iter: 400/834, loss: 0.38863, lr: 1.452739, top1: 0.49406, throughput: 314.11 | 2022-04-03 07:32:00.943 [rank:2] [train], epoch: 7/50, iter: 400/834, loss: 0.38824, lr: 1.452739, top1: 0.49297, throughput: 313.92 | 2022-04-03 07:32:00.957 [rank:4] [train], epoch: 7/50, iter: 400/834, loss: 0.38899, lr: 1.452739, top1: 0.48922, throughput: 313.98 | 2022-04-03 07:32:00.962 [rank:1] [train], epoch: 7/50, iter: 400/834, loss: 0.38821, lr: 1.452739, top1: 0.49354, throughput: 313.97 | 2022-04-03 07:32:00.964 [rank:6] [train], epoch: 7/50, iter: 400/834, loss: 0.38595, lr: 1.452739, top1: 0.49411, throughput: 313.91 | 2022-04-03 07:32:00.968 [rank:5] [train], epoch: 7/50, iter: 400/834, loss: 0.38870, lr: 1.452739, top1: 0.49229, throughput: 313.75 | 2022-04-03 07:32:00.988 [rank:0] [train], epoch: 7/50, iter: 400/834, loss: 0.38846, lr: 1.452739, top1: 0.48755, throughput: 313.86 | 2022-04-03 07:32:00.996 [rank:6] [train], epoch: 7/50, iter: 500/834, loss: 0.39046, lr: 1.450099, top1: 0.48781, throughput: 311.35 | 2022-04-03 07:33:02.636 [rank:1] [train], epoch: 7/50, iter: 500/834, loss: 0.38920, lr: 1.450099, top1: 0.48609, throughput: 311.26 | 2022-04-03 07:33:02.648 [rank:7] [train], epoch: 7/50, iter: 500/834, loss: 0.38900, lr: 1.450099, top1: 0.49099, throughput: 311.04 | 2022-04-03 07:33:02.659 [rank:3] [train], epoch: 7/50, iter: 500/834, loss: 0.38761, lr: 1.450099, top1: 0.48865, throughput: 310.97 | 2022-04-03 07:33:02.685 [rank:5] [train], epoch: 7/50, iter: 500/834, loss: 0.38790, lr: 1.450099, top1: 0.49130, throughput: 311.15 | 2022-04-03 07:33:02.694 [rank:2] [train], epoch: 7/50, iter: 500/834, loss: 0.38829, lr: 1.450099, top1: 0.49297, throughput: 310.99 | 2022-04-03 07:33:02.694 [rank:0] [train], epoch: 7/50, iter: 500/834, loss: 0.38825, lr: 1.450099, top1: 0.48698, throughput: 311.18 | 2022-04-03 07:33:02.696 [rank:4] [train], epoch: 7/50, iter: 500/834, loss: 0.39225, lr: 1.450099, top1: 0.48438, throughput: 310.95 | 2022-04-03 07:33:02.709 [rank:1] [train], epoch: 7/50, iter: 600/834, loss: 0.39194, lr: 1.447421, top1: 0.48448, throughput: 312.29 | 2022-04-03 07:34:04.130 [rank:7] [train], epoch: 7/50, iter: 600/834, loss: 0.38612, lr: 1.447421, top1: 0.49849, throughput: 312.27 | 2022-04-03 07:34:04.144 [rank:2] [train], epoch: 7/50, iter: 600/834, loss: 0.38965, lr: 1.447421, top1: 0.48484, throughput: 312.42 | 2022-04-03 07:34:04.150 [rank:3] [train], epoch: 7/50, iter: 600/834, loss: 0.38911, lr: 1.447421, top1: 0.49021, throughput: 312.36 | 2022-04-03 07:34:04.152 [rank:6] [train], epoch: 7/50, iter: 600/834, loss: 0.38787, lr: 1.447421, top1: 0.48828, throughput: 311.92 | 2022-04-03 07:34:04.190 [rank:4] [train], epoch: 7/50, iter: 600/834, loss: 0.38770, lr: 1.447421, top1: 0.49526, throughput: 312.25 | 2022-04-03 07:34:04.198 [rank:5] [train], epoch: 7/50, iter: 600/834, loss: 0.38884, lr: 1.447421, top1: 0.48917, throughput: 312.17 | 2022-04-03 07:34:04.199 [rank:0] [train], epoch: 7/50, iter: 600/834, loss: 0.38557, lr: 1.447421, top1: 0.49854, throughput: 312.13 | 2022-04-03 07:34:04.210 [rank:3] [train], epoch: 7/50, iter: 700/834, loss: 0.38674, lr: 1.444704, top1: 0.49646, throughput: 312.34 | 2022-04-03 07:35:05.623 [rank:7] [train], epoch: 7/50, iter: 700/834, loss: 0.38718, lr: 1.444704, top1: 0.49474, throughput: 312.25 | 2022-04-03 07:35:05.633 [rank:2] [train], epoch: 7/50, iter: 700/834, loss: 0.38666, lr: 1.444704, top1: 0.49036, throughput: 312.22 | 2022-04-03 07:35:05.645 [rank:1] [train], epoch: 7/50, iter: 700/834, loss: 0.38703, lr: 1.444704, top1: 0.49255, throughput: 312.11 | 2022-04-03 07:35:05.648 [rank:5] [train], epoch: 7/50, iter: 700/834, loss: 0.39090, lr: 1.444704, top1: 0.48604, throughput: 312.24 | 2022-04-03 07:35:05.690 [rank:4] [train], epoch: 7/50, iter: 700/834, loss: 0.38768, lr: 1.444704, top1: 0.49635, throughput: 312.17 | 2022-04-03 07:35:05.703 [rank:0] [train], epoch: 7/50, iter: 700/834, loss: 0.38887, lr: 1.444704, top1: 0.48818, throughput: 312.17 | 2022-04-03 07:35:05.715 [rank:6] [train], epoch: 7/50, iter: 700/834, loss: 0.38911, lr: 1.444704, top1: 0.48547, throughput: 312.48 | 2022-04-03 07:35:05.634 [rank:7] [train], epoch: 7/50, iter: 800/834, loss: 0.38668, lr: 1.441949, top1: 0.49266, throughput: 312.27 | 2022-04-03 07:36:07.119 [rank:2] [train], epoch: 7/50, iter: 800/834, loss: 0.38441, lr: 1.441949, top1: 0.49917, throughput: 312.14 | 2022-04-03 07:36:07.156 [rank:0] [train], epoch: 7/50, iter: 800/834, loss: 0.38686, lr: 1.441949, top1: 0.49484, throughput: 312.38 | 2022-04-03 07:36:07.178 [rank:4] [train], epoch: 7/50, iter: 800/834, loss: 0.39023, lr: 1.441949, top1: 0.48411, throughput: 312.25 | 2022-04-03 07:36:07.191 [rank:6] [train], epoch: 7/50, iter: 800/834, loss: 0.38650, lr: 1.441949, top1: 0.49281, throughput: 311.90 | 2022-04-03 07:36:07.192 [rank:5] [train], epoch: 7/50, iter: 800/834, loss: 0.38635, lr: 1.441949, top1: 0.49771, throughput: 312.16 | 2022-04-03 07:36:07.198 [rank:1] [train], epoch: 7/50, iter: 800/834, loss: 0.38874, lr: 1.441949, top1: 0.48740, throughput: 311.90 | 2022-04-03 07:36:07.205 [rank:3] [train], epoch: 7/50, iter: 800/834, loss: 0.39010, lr: 1.441949, top1: 0.48932, throughput: 311.71 | 2022-04-03 07:36:07.219 [rank:5] [train], epoch: 7/50, iter: 834/834, loss: 0.38616, lr: 1.441004, top1: 0.49556, throughput: 312.88 | 2022-04-03 07:36:28.062 [rank:3] [train], epoch: 7/50, iter: 834/834, loss: 0.38447, lr: 1.441004, top1: 0.50184, throughput: 313.08 | 2022-04-03 07:36:28.070 [rank:2] [train], epoch: 7/50, iter: 834/834, loss: 0.38390, lr: 1.441004, top1: 0.50000, throughput: 312.11 | 2022-04-03 07:36:28.071 [rank:6] [train], epoch: 7/50, iter: 834/834, loss: 0.38768, lr: 1.441004, top1: 0.48943, throughput: 312.63 | 2022-04-03 07:36:28.073 [rank:1] [train], epoch: 7/50, iter: 834/834, loss: 0.38281, lr: 1.441004, top1: 0.50398, throughput: 312.78 | 2022-04-03 07:36:28.076 [rank:7] [train], epoch: 7/50, iter: 834/834, loss: 0.38202, lr: 1.441004, top1: 0.49893, throughput: 311.47 | 2022-04-03 07:36:28.077 [rank:0] [train], epoch: 7/50, iter: 834/834, loss: 0.39209, lr: 1.441004, top1: 0.48606, throughput: 312.29 | 2022-04-03 07:36:28.082 [rank:4] [train], epoch: 7/50, iter: 834/834, loss: 0.38810, lr: 1.441004, top1: 0.49510, throughput: 312.42 | 2022-04-03 07:36:28.086 [rank:5] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.50224, throughput: 483.63 | 2022-04-03 07:36:40.985 [rank:4] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.51104, throughput: 484.40 | 2022-04-03 07:36:40.988 [rank:0] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.52176, throughput: 484.22 | 2022-04-03 07:36:40.989 [rank:6] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.51872, throughput: 483.85 | 2022-04-03 07:36:40.990 [rank:7] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.52464, throughput: 483.77 | 2022-04-03 07:36:40.997 [rank:1] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.52016, throughput: 483.43 | 2022-04-03 07:36:41.004 [rank:2] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.52512, throughput: 483.15 | 2022-04-03 07:36:41.007 [rank:3] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.51392, throughput: 482.35 | 2022-04-03 07:36:41.028 [rank:6] [train], epoch: 8/50, iter: 100/834, loss: 0.38179, lr: 1.438197, top1: 0.50297, throughput: 313.53 | 2022-04-03 07:37:42.227 [rank:7] [train], epoch: 8/50, iter: 100/834, loss: 0.38032, lr: 1.438197, top1: 0.50161, throughput: 313.43 | 2022-04-03 07:37:42.254 [rank:2] [train], epoch: 8/50, iter: 100/834, loss: 0.37831, lr: 1.438197, top1: 0.50448, throughput: 313.46 | 2022-04-03 07:37:42.259 [rank:0] [train], epoch: 8/50, iter: 100/834, loss: 0.37643, lr: 1.438197, top1: 0.51318, throughput: 313.37 | 2022-04-03 07:37:42.259 [rank:5] [train], epoch: 8/50, iter: 100/834, loss: 0.38020, lr: 1.438197, top1: 0.51021, throughput: 313.34 | 2022-04-03 07:37:42.260 [rank:3] [train], epoch: 8/50, iter: 100/834, loss: 0.38051, lr: 1.438197, top1: 0.50193, throughput: 313.49 | 2022-04-03 07:37:42.274 [rank:4] [train], epoch: 8/50, iter: 100/834, loss: 0.37906, lr: 1.438197, top1: 0.50542, throughput: 313.24 | 2022-04-03 07:37:42.284 [rank:1] [train], epoch: 8/50, iter: 100/834, loss: 0.37898, lr: 1.438197, top1: 0.50563, throughput: 313.13 | 2022-04-03 07:37:42.321 [rank:6] [train], epoch: 8/50, iter: 200/834, loss: 0.38050, lr: 1.435353, top1: 0.50667, throughput: 312.09 | 2022-04-03 07:38:43.748 [rank:4] [train], epoch: 8/50, iter: 200/834, loss: 0.38347, lr: 1.435353, top1: 0.50156, throughput: 312.37 | 2022-04-03 07:38:43.749 [rank:3] [train], epoch: 8/50, iter: 200/834, loss: 0.38304, lr: 1.435353, top1: 0.49781, throughput: 312.23 | 2022-04-03 07:38:43.766 [rank:0] [train], epoch: 8/50, iter: 200/834, loss: 0.38299, lr: 1.435353, top1: 0.50057, throughput: 312.07 | 2022-04-03 07:38:43.785 [rank:5] [train], epoch: 8/50, iter: 200/834, loss: 0.38230, lr: 1.435353, top1: 0.49896, throughput: 312.02 | 2022-04-03 07:38:43.795 [rank:2] [train], epoch: 8/50, iter: 200/834, loss: 0.38201, lr: 1.435353, top1: 0.49937, throughput: 312.01 | 2022-04-03 07:38:43.796 [rank:1] [train], epoch: 8/50, iter: 200/834, loss: 0.38347, lr: 1.435353, top1: 0.49943, throughput: 312.31 | 2022-04-03 07:38:43.798 [rank:7] [train], epoch: 8/50, iter: 200/834, loss: 0.38157, lr: 1.435353, top1: 0.50099, throughput: 311.89 | 2022-04-03 07:38:43.815 [rank:7] [train], epoch: 8/50, iter: 300/834, loss: 0.37673, lr: 1.432470, top1: 0.51391, throughput: 313.86 | 2022-04-03 07:39:44.989 [rank:5] [train], epoch: 8/50, iter: 300/834, loss: 0.38042, lr: 1.432470, top1: 0.50167, throughput: 313.74 | 2022-04-03 07:39:44.992 [rank:6] [train], epoch: 8/50, iter: 300/834, loss: 0.38065, lr: 1.432470, top1: 0.50036, throughput: 313.46 | 2022-04-03 07:39:45.000 [rank:2] [train], epoch: 8/50, iter: 300/834, loss: 0.37906, lr: 1.432470, top1: 0.51385, throughput: 313.61 | 2022-04-03 07:39:45.018 [rank:1] [train], epoch: 8/50, iter: 300/834, loss: 0.38159, lr: 1.432470, top1: 0.49849, throughput: 313.54 | 2022-04-03 07:39:45.034 [rank:0] [train], epoch: 8/50, iter: 300/834, loss: 0.37993, lr: 1.432470, top1: 0.50271, throughput: 313.43 | 2022-04-03 07:39:45.043 [rank:3] [train], epoch: 8/50, iter: 300/834, loss: 0.38027, lr: 1.432470, top1: 0.50474, throughput: 313.24 | 2022-04-03 07:39:45.062 [rank:4] [train], epoch: 8/50, iter: 300/834, loss: 0.37788, lr: 1.432470, top1: 0.50906, throughput: 313.00 | 2022-04-03 07:39:45.091 [rank:6] [train], epoch: 8/50, iter: 400/834, loss: 0.37978, lr: 1.429550, top1: 0.50495, throughput: 313.45 | 2022-04-03 07:40:46.255 [rank:0] [train], epoch: 8/50, iter: 400/834, loss: 0.38213, lr: 1.429550, top1: 0.50156, throughput: 313.66 | 2022-04-03 07:40:46.257 [rank:1] [train], epoch: 8/50, iter: 400/834, loss: 0.37880, lr: 1.429550, top1: 0.50443, throughput: 313.60 | 2022-04-03 07:40:46.258 [rank:2] [train], epoch: 8/50, iter: 400/834, loss: 0.37902, lr: 1.429550, top1: 0.50792, throughput: 313.33 | 2022-04-03 07:40:46.294 [rank:4] [train], epoch: 8/50, iter: 400/834, loss: 0.38095, lr: 1.429550, top1: 0.50063, throughput: 313.68 | 2022-04-03 07:40:46.300 [rank:7] [train], epoch: 8/50, iter: 400/834, loss: 0.37921, lr: 1.429550, top1: 0.50901, throughput: 313.15 | 2022-04-03 07:40:46.302 [rank:5] [train], epoch: 8/50, iter: 400/834, loss: 0.38251, lr: 1.429550, top1: 0.50495, throughput: 313.09 | 2022-04-03 07:40:46.316 [rank:3] [train], epoch: 8/50, iter: 400/834, loss: 0.38137, lr: 1.429550, top1: 0.50161, throughput: 313.39 | 2022-04-03 07:40:46.327 [rank:0] [train], epoch: 8/50, iter: 500/834, loss: 0.38273, lr: 1.426592, top1: 0.50453, throughput: 312.70 | 2022-04-03 07:41:47.658 [rank:7] [train], epoch: 8/50, iter: 500/834, loss: 0.38257, lr: 1.426592, top1: 0.49948, throughput: 312.73 | 2022-04-03 07:41:47.698 [rank:3] [train], epoch: 8/50, iter: 500/834, loss: 0.37885, lr: 1.426592, top1: 0.50755, throughput: 312.70 | 2022-04-03 07:41:47.728 [rank:5] [train], epoch: 8/50, iter: 500/834, loss: 0.38124, lr: 1.426592, top1: 0.50563, throughput: 312.59 | 2022-04-03 07:41:47.738 [rank:1] [train], epoch: 8/50, iter: 500/834, loss: 0.38074, lr: 1.426592, top1: 0.50594, throughput: 312.28 | 2022-04-03 07:41:47.742 [rank:2] [train], epoch: 8/50, iter: 500/834, loss: 0.37966, lr: 1.426592, top1: 0.50839, throughput: 312.44 | 2022-04-03 07:41:47.747 [rank:6] [train], epoch: 8/50, iter: 500/834, loss: 0.37790, lr: 1.426592, top1: 0.50818, throughput: 312.22 | 2022-04-03 07:41:47.750 [rank:4] [train], epoch: 8/50, iter: 500/834, loss: 0.38125, lr: 1.426592, top1: 0.50281, throughput: 312.24 | 2022-04-03 07:41:47.791 [rank:7] [train], epoch: 8/50, iter: 600/834, loss: 0.37972, lr: 1.423597, top1: 0.50661, throughput: 312.15 | 2022-04-03 07:42:49.208 [rank:3] [train], epoch: 8/50, iter: 600/834, loss: 0.37822, lr: 1.423597, top1: 0.50630, throughput: 312.08 | 2022-04-03 07:42:49.250 [rank:6] [train], epoch: 8/50, iter: 600/834, loss: 0.37708, lr: 1.423597, top1: 0.51307, throughput: 312.15 | 2022-04-03 07:42:49.258 [rank:1] [train], epoch: 8/50, iter: 600/834, loss: 0.38173, lr: 1.423597, top1: 0.50245, throughput: 312.09 | 2022-04-03 07:42:49.262 [rank:0] [train], epoch: 8/50, iter: 600/834, loss: 0.37920, lr: 1.423597, top1: 0.50510, throughput: 311.59 | 2022-04-03 07:42:49.278 [rank:5] [train], epoch: 8/50, iter: 600/834, loss: 0.38107, lr: 1.423597, top1: 0.50401, throughput: 311.89 | 2022-04-03 07:42:49.297 [rank:2] [train], epoch: 8/50, iter: 600/834, loss: 0.37705, lr: 1.423597, top1: 0.51245, throughput: 311.93 | 2022-04-03 07:42:49.298 [rank:4] [train], epoch: 8/50, iter: 600/834, loss: 0.38111, lr: 1.423597, top1: 0.49943, throughput: 312.08 | 2022-04-03 07:42:49.313 [rank:0] [train], epoch: 8/50, iter: 700/834, loss: 0.37840, lr: 1.420565, top1: 0.50740, throughput: 311.97 | 2022-04-03 07:43:50.823 [rank:5] [train], epoch: 8/50, iter: 700/834, loss: 0.37895, lr: 1.420565, top1: 0.50422, throughput: 311.98 | 2022-04-03 07:43:50.840 [rank:6] [train], epoch: 8/50, iter: 700/834, loss: 0.37881, lr: 1.420565, top1: 0.50542, throughput: 311.65 | 2022-04-03 07:43:50.866 [rank:3] [train], epoch: 8/50, iter: 700/834, loss: 0.37828, lr: 1.420565, top1: 0.50953, throughput: 311.60 | 2022-04-03 07:43:50.867 [rank:1] [train], epoch: 8/50, iter: 700/834, loss: 0.37991, lr: 1.420565, top1: 0.50495, throughput: 311.61 | 2022-04-03 07:43:50.878 [rank:4] [train], epoch: 8/50, iter: 700/834, loss: 0.37680, lr: 1.420565, top1: 0.51234, throughput: 311.81 | 2022-04-03 07:43:50.890 [rank:2] [train], epoch: 8/50, iter: 700/834, loss: 0.38125, lr: 1.420565, top1: 0.50594, throughput: 311.64 | 2022-04-03 07:43:50.909 [rank:7] [train], epoch: 8/50, iter: 700/834, loss: 0.37792, lr: 1.420565, top1: 0.50807, throughput: 311.11 | 2022-04-03 07:43:50.923 [rank:7] [train], epoch: 8/50, iter: 800/834, loss: 0.38129, lr: 1.417496, top1: 0.50234, throughput: 313.57 | 2022-04-03 07:44:52.154 [rank:6] [train], epoch: 8/50, iter: 800/834, loss: 0.37866, lr: 1.417496, top1: 0.50573, throughput: 313.21 | 2022-04-03 07:44:52.166 [rank:5] [train], epoch: 8/50, iter: 800/834, loss: 0.38045, lr: 1.417496, top1: 0.50615, throughput: 312.95 | 2022-04-03 07:44:52.191 [rank:4] [train], epoch: 8/50, iter: 800/834, loss: 0.37793, lr: 1.417496, top1: 0.50854, throughput: 313.19 | 2022-04-03 07:44:52.195 [rank:3] [train], epoch: 8/50, iter: 800/834, loss: 0.37964, lr: 1.417496, top1: 0.50464, throughput: 313.02 | 2022-04-03 07:44:52.206 [rank:1] [train], epoch: 8/50, iter: 800/834, loss: 0.37838, lr: 1.417496, top1: 0.51151, throughput: 312.94 | 2022-04-03 07:44:52.232 [rank:0] [train], epoch: 8/50, iter: 800/834, loss: 0.37833, lr: 1.417496, top1: 0.50458, throughput: 313.11 | 2022-04-03 07:44:52.143 [rank:2] [train], epoch: 8/50, iter: 800/834, loss: 0.37676, lr: 1.417496, top1: 0.50891, throughput: 313.57 | 2022-04-03 07:44:52.139 [rank:3] [train], epoch: 8/50, iter: 834/834, loss: 0.37564, lr: 1.416444, top1: 0.50980, throughput: 313.18 | 2022-04-03 07:45:13.050 [rank:1] [train], epoch: 8/50, iter: 834/834, loss: 0.37883, lr: 1.416444, top1: 0.49556, throughput: 313.56 | 2022-04-03 07:45:13.051 [rank:5] [train], epoch: 8/50, iter: 834/834, loss: 0.38377, lr: 1.416444, top1: 0.50123, throughput: 312.50 | 2022-04-03 07:45:13.081 [rank:4] [train], epoch: 8/50, iter: 834/834, loss: 0.38158, lr: 1.416444, top1: 0.50061, throughput: 312.55 | 2022-04-03 07:45:13.082 [rank:7] [train], epoch: 8/50, iter: 834/834, loss: 0.37529, lr: 1.416444, top1: 0.51149, throughput: 311.92 | 2022-04-03 07:45:13.082 [rank:6] [train], epoch: 8/50, iter: 834/834, loss: 0.37900, lr: 1.416444, top1: 0.50398, throughput: 312.10 | 2022-04-03 07:45:13.082 [rank:0] [train], epoch: 8/50, iter: 834/834, loss: 0.38252, lr: 1.416444, top1: 0.49954, throughput: 311.75 | 2022-04-03 07:45:13.082 [rank:2] [train], epoch: 8/50, iter: 834/834, loss: 0.37615, lr: 1.416444, top1: 0.50873, throughput: 311.43 | 2022-04-03 07:45:13.100 [rank:0] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.48928, throughput: 489.03 | 2022-04-03 07:45:25.863 [rank:2] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.48640, throughput: 489.06 | 2022-04-03 07:45:25.879 [rank:7] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.49440, throughput: 488.23 | 2022-04-03 07:45:25.884 [rank:6] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.48688, throughput: 488.19 | 2022-04-03 07:45:25.884 [rank:4] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.47792, throughput: 488.11 | 2022-04-03 07:45:25.886 [rank:5] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.48064, throughput: 487.32 | 2022-04-03 07:45:25.906 [rank:3] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.48112, throughput: 486.06 | 2022-04-03 07:45:25.909 [rank:1] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.48224, throughput: 486.01 | 2022-04-03 07:45:25.911 [rank:6] [train], epoch: 9/50, iter: 100/834, loss: 0.37427, lr: 1.413325, top1: 0.51349, throughput: 312.48 | 2022-04-03 07:46:27.329 [rank:2] [train], epoch: 9/50, iter: 100/834, loss: 0.37349, lr: 1.413325, top1: 0.51453, throughput: 312.39 | 2022-04-03 07:46:27.342 [rank:4] [train], epoch: 9/50, iter: 100/834, loss: 0.37064, lr: 1.413325, top1: 0.52562, throughput: 312.35 | 2022-04-03 07:46:27.356 [rank:0] [train], epoch: 9/50, iter: 100/834, loss: 0.37108, lr: 1.413325, top1: 0.52135, throughput: 312.19 | 2022-04-03 07:46:27.364 [rank:7] [train], epoch: 9/50, iter: 100/834, loss: 0.37101, lr: 1.413325, top1: 0.52344, throughput: 312.19 | 2022-04-03 07:46:27.385 [rank:3] [train], epoch: 9/50, iter: 100/834, loss: 0.37293, lr: 1.413325, top1: 0.51818, throughput: 312.30 | 2022-04-03 07:46:27.388 [rank:1] [train], epoch: 9/50, iter: 100/834, loss: 0.37342, lr: 1.413325, top1: 0.51130, throughput: 312.30 | 2022-04-03 07:46:27.390 [rank:5] [train], epoch: 9/50, iter: 100/834, loss: 0.37547, lr: 1.413325, top1: 0.51109, throughput: 312.22 | 2022-04-03 07:46:27.401 [rank:1] [train], epoch: 9/50, iter: 200/834, loss: 0.37209, lr: 1.410170, top1: 0.51865, throughput: 313.54 | 2022-04-03 07:47:28.626 [rank:5] [train], epoch: 9/50, iter: 200/834, loss: 0.37475, lr: 1.410170, top1: 0.51188, throughput: 313.47 | 2022-04-03 07:47:28.651 [rank:7] [train], epoch: 9/50, iter: 200/834, loss: 0.37268, lr: 1.410170, top1: 0.51958, throughput: 313.34 | 2022-04-03 07:47:28.660 [rank:3] [train], epoch: 9/50, iter: 200/834, loss: 0.37591, lr: 1.410170, top1: 0.51193, throughput: 313.31 | 2022-04-03 07:47:28.669 [rank:4] [train], epoch: 9/50, iter: 200/834, loss: 0.37249, lr: 1.410170, top1: 0.51859, throughput: 313.14 | 2022-04-03 07:47:28.670 [rank:2] [train], epoch: 9/50, iter: 200/834, loss: 0.37324, lr: 1.410170, top1: 0.51104, throughput: 313.40 | 2022-04-03 07:47:28.605 [rank:0] [train], epoch: 9/50, iter: 200/834, loss: 0.37142, lr: 1.410170, top1: 0.52109, throughput: 313.05 | 2022-04-03 07:47:28.696 [rank:6] [train], epoch: 9/50, iter: 200/834, loss: 0.37311, lr: 1.410170, top1: 0.52234, throughput: 312.84 | 2022-04-03 07:47:28.703 [rank:7] [train], epoch: 9/50, iter: 300/834, loss: 0.37616, lr: 1.406978, top1: 0.51005, throughput: 312.22 | 2022-04-03 07:48:30.155 [rank:1] [train], epoch: 9/50, iter: 300/834, loss: 0.37068, lr: 1.406978, top1: 0.52073, throughput: 311.95 | 2022-04-03 07:48:30.174 [rank:5] [train], epoch: 9/50, iter: 300/834, loss: 0.37560, lr: 1.406978, top1: 0.51255, throughput: 312.06 | 2022-04-03 07:48:30.179 [rank:2] [train], epoch: 9/50, iter: 300/834, loss: 0.37446, lr: 1.406978, top1: 0.51531, throughput: 311.76 | 2022-04-03 07:48:30.191 [rank:0] [train], epoch: 9/50, iter: 300/834, loss: 0.37237, lr: 1.406978, top1: 0.52151, throughput: 312.17 | 2022-04-03 07:48:30.200 [rank:6] [train], epoch: 9/50, iter: 300/834, loss: 0.37263, lr: 1.406978, top1: 0.51568, throughput: 312.18 | 2022-04-03 07:48:30.205 [rank:4] [train], epoch: 9/50, iter: 300/834, loss: 0.37519, lr: 1.406978, top1: 0.51568, throughput: 311.96 | 2022-04-03 07:48:30.216 [rank:3] [train], epoch: 9/50, iter: 300/834, loss: 0.37377, lr: 1.406978, top1: 0.51568, throughput: 311.95 | 2022-04-03 07:48:30.218 [rank:6] [train], epoch: 9/50, iter: 400/834, loss: 0.37457, lr: 1.403750, top1: 0.51255, throughput: 314.47 | 2022-04-03 07:49:31.261 [rank:0] [train], epoch: 9/50, iter: 400/834, loss: 0.37142, lr: 1.403750, top1: 0.51839, throughput: 314.40 | 2022-04-03 07:49:31.269 [rank:7] [train], epoch: 9/50, iter: 400/834, loss: 0.37552, lr: 1.403750, top1: 0.51219, throughput: 314.15 | 2022-04-03 07:49:31.274 [rank:1] [train], epoch: 9/50, iter: 400/834, loss: 0.37197, lr: 1.403750, top1: 0.51995, throughput: 314.20 | 2022-04-03 07:49:31.281 [rank:5] [train], epoch: 9/50, iter: 400/834, loss: 0.37501, lr: 1.403750, top1: 0.51479, throughput: 314.20 | 2022-04-03 07:49:31.285 [rank:4] [train], epoch: 9/50, iter: 400/834, loss: 0.37293, lr: 1.403750, top1: 0.51417, throughput: 314.22 | 2022-04-03 07:49:31.319 [rank:2] [train], epoch: 9/50, iter: 400/834, loss: 0.37134, lr: 1.403750, top1: 0.52312, throughput: 314.09 | 2022-04-03 07:49:31.320 [rank:3] [train], epoch: 9/50, iter: 400/834, loss: 0.37230, lr: 1.403750, top1: 0.51391, throughput: 314.23 | 2022-04-03 07:49:31.320 [rank:4] [train], epoch: 9/50, iter: 500/834, loss: 0.37093, lr: 1.400486, top1: 0.52198, throughput: 312.64 | 2022-04-03 07:50:32.731 [rank:7] [train], epoch: 9/50, iter: 500/834, loss: 0.37187, lr: 1.400486, top1: 0.52109, throughput: 312.38 | 2022-04-03 07:50:32.737 [rank:1] [train], epoch: 9/50, iter: 500/834, loss: 0.37386, lr: 1.400486, top1: 0.51120, throughput: 312.35 | 2022-04-03 07:50:32.750 [rank:2] [train], epoch: 9/50, iter: 500/834, loss: 0.37374, lr: 1.400486, top1: 0.51089, throughput: 312.51 | 2022-04-03 07:50:32.759 [rank:0] [train], epoch: 9/50, iter: 500/834, loss: 0.36709, lr: 1.400486, top1: 0.53073, throughput: 312.16 | 2022-04-03 07:50:32.775 [rank:3] [train], epoch: 9/50, iter: 500/834, loss: 0.36881, lr: 1.400486, top1: 0.52448, throughput: 312.39 | 2022-04-03 07:50:32.781 [rank:5] [train], epoch: 9/50, iter: 500/834, loss: 0.37247, lr: 1.400486, top1: 0.51995, throughput: 312.06 | 2022-04-03 07:50:32.812 [rank:6] [train], epoch: 9/50, iter: 500/834, loss: 0.37203, lr: 1.400486, top1: 0.52182, throughput: 311.89 | 2022-04-03 07:50:32.820 [rank:3] [train], epoch: 9/50, iter: 600/834, loss: 0.36982, lr: 1.397186, top1: 0.52000, throughput: 313.94 | 2022-04-03 07:51:33.939 [rank:1] [train], epoch: 9/50, iter: 600/834, loss: 0.37185, lr: 1.397186, top1: 0.51693, throughput: 313.63 | 2022-04-03 07:51:33.968 [rank:7] [train], epoch: 9/50, iter: 600/834, loss: 0.36743, lr: 1.397186, top1: 0.52854, throughput: 313.54 | 2022-04-03 07:51:33.972 [rank:5] [train], epoch: 9/50, iter: 600/834, loss: 0.37352, lr: 1.397186, top1: 0.51646, throughput: 313.87 | 2022-04-03 07:51:33.983 [rank:0] [train], epoch: 9/50, iter: 600/834, loss: 0.37438, lr: 1.397186, top1: 0.51557, throughput: 313.63 | 2022-04-03 07:51:33.995 [rank:6] [train], epoch: 9/50, iter: 600/834, loss: 0.37181, lr: 1.397186, top1: 0.52297, throughput: 313.81 | 2022-04-03 07:51:34.005 [rank:2] [train], epoch: 9/50, iter: 600/834, loss: 0.37380, lr: 1.397186, top1: 0.51828, throughput: 313.47 | 2022-04-03 07:51:34.008 [rank:4] [train], epoch: 9/50, iter: 600/834, loss: 0.37112, lr: 1.397186, top1: 0.52516, throughput: 313.31 | 2022-04-03 07:51:34.011 [rank:3] [train], epoch: 9/50, iter: 700/834, loss: 0.37219, lr: 1.393851, top1: 0.52000, throughput: 313.93 | 2022-04-03 07:52:35.099 [rank:6] [train], epoch: 9/50, iter: 700/834, loss: 0.37372, lr: 1.393851, top1: 0.51760, throughput: 314.27 | 2022-04-03 07:52:35.100 [rank:7] [train], epoch: 9/50, iter: 700/834, loss: 0.37247, lr: 1.393851, top1: 0.52010, throughput: 313.97 | 2022-04-03 07:52:35.126 [rank:0] [train], epoch: 9/50, iter: 700/834, loss: 0.37472, lr: 1.393851, top1: 0.51406, throughput: 313.98 | 2022-04-03 07:52:35.145 [rank:2] [train], epoch: 9/50, iter: 700/834, loss: 0.37229, lr: 1.393851, top1: 0.51906, throughput: 314.05 | 2022-04-03 07:52:35.146 [rank:1] [train], epoch: 9/50, iter: 700/834, loss: 0.37107, lr: 1.393851, top1: 0.52047, throughput: 313.82 | 2022-04-03 07:52:35.150 [rank:5] [train], epoch: 9/50, iter: 700/834, loss: 0.37379, lr: 1.393851, top1: 0.51661, throughput: 313.87 | 2022-04-03 07:52:35.155 [rank:4] [train], epoch: 9/50, iter: 700/834, loss: 0.37627, lr: 1.393851, top1: 0.51141, throughput: 313.89 | 2022-04-03 07:52:35.180 [rank:3] [train], epoch: 9/50, iter: 800/834, loss: 0.37350, lr: 1.390479, top1: 0.51729, throughput: 312.04 | 2022-04-03 07:53:36.631 [rank:1] [train], epoch: 9/50, iter: 800/834, loss: 0.37256, lr: 1.390479, top1: 0.51604, throughput: 312.25 | 2022-04-03 07:53:36.638 [rank:6] [train], epoch: 9/50, iter: 800/834, loss: 0.37071, lr: 1.390479, top1: 0.51990, throughput: 311.86 | 2022-04-03 07:53:36.665 [rank:7] [train], epoch: 9/50, iter: 800/834, loss: 0.37030, lr: 1.390479, top1: 0.52000, throughput: 311.98 | 2022-04-03 07:53:36.669 [rank:2] [train], epoch: 9/50, iter: 800/834, loss: 0.37253, lr: 1.390479, top1: 0.51927, throughput: 312.02 | 2022-04-03 07:53:36.681 [rank:4] [train], epoch: 9/50, iter: 800/834, loss: 0.37214, lr: 1.390479, top1: 0.51818, throughput: 312.16 | 2022-04-03 07:53:36.687 [rank:5] [train], epoch: 9/50, iter: 800/834, loss: 0.36853, lr: 1.390479, top1: 0.52547, throughput: 311.90 | 2022-04-03 07:53:36.714 [rank:0] [train], epoch: 9/50, iter: 800/834, loss: 0.37164, lr: 1.390479, top1: 0.52104, throughput: 311.72 | 2022-04-03 07:53:36.739 [rank:1] [train], epoch: 9/50, iter: 834/834, loss: 0.37122, lr: 1.389325, top1: 0.51900, throughput: 313.77 | 2022-04-03 07:53:57.443 [rank:4] [train], epoch: 9/50, iter: 834/834, loss: 0.37284, lr: 1.389325, top1: 0.50597, throughput: 314.43 | 2022-04-03 07:53:57.448 [rank:7] [train], epoch: 9/50, iter: 834/834, loss: 0.37068, lr: 1.389325, top1: 0.52298, throughput: 314.14 | 2022-04-03 07:53:57.449 [rank:5] [train], epoch: 9/50, iter: 834/834, loss: 0.37390, lr: 1.389325, top1: 0.51271, throughput: 314.72 | 2022-04-03 07:53:57.456 [rank:3] [train], epoch: 9/50, iter: 834/834, loss: 0.37047, lr: 1.389325, top1: 0.52252, throughput: 313.45 | 2022-04-03 07:53:57.457 [rank:6] [train], epoch: 9/50, iter: 834/834, loss: 0.37075, lr: 1.389325, top1: 0.51639, throughput: 313.89 | 2022-04-03 07:53:57.462 [rank:0] [train], epoch: 9/50, iter: 834/834, loss: 0.37678, lr: 1.389325, top1: 0.51608, throughput: 314.87 | 2022-04-03 07:53:57.471 [rank:2] [train], epoch: 9/50, iter: 834/834, loss: 0.36892, lr: 1.389325, top1: 0.52405, throughput: 313.92 | 2022-04-03 07:53:57.476 [rank:0] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.50064, throughput: 488.10 | 2022-04-03 07:54:10.276 [rank:4] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.48528, throughput: 487.03 | 2022-04-03 07:54:10.281 [rank:6] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.49040, throughput: 487.37 | 2022-04-03 07:54:10.286 [rank:7] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.50000, throughput: 486.80 | 2022-04-03 07:54:10.288 [rank:2] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.49392, throughput: 487.68 | 2022-04-03 07:54:10.292 [rank:1] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.49216, throughput: 485.22 | 2022-04-03 07:54:10.324 [rank:3] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.49232, throughput: 485.76 | 2022-04-03 07:54:10.324 [rank:5] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.48208, throughput: 485.32 | 2022-04-03 07:54:10.334 [rank:0] [train], epoch: 10/50, iter: 100/834, loss: 0.36627, lr: 1.385907, top1: 0.53057, throughput: 312.06 | 2022-04-03 07:55:11.802 [rank:3] [train], epoch: 10/50, iter: 100/834, loss: 0.36481, lr: 1.385907, top1: 0.53078, throughput: 312.25 | 2022-04-03 07:55:11.813 [rank:6] [train], epoch: 10/50, iter: 100/834, loss: 0.36608, lr: 1.385907, top1: 0.52854, throughput: 311.95 | 2022-04-03 07:55:11.834 [rank:7] [train], epoch: 10/50, iter: 100/834, loss: 0.36755, lr: 1.385907, top1: 0.52490, throughput: 311.88 | 2022-04-03 07:55:11.851 [rank:4] [train], epoch: 10/50, iter: 100/834, loss: 0.36329, lr: 1.385907, top1: 0.53146, throughput: 311.84 | 2022-04-03 07:55:11.851 [rank:1] [train], epoch: 10/50, iter: 100/834, loss: 0.36661, lr: 1.385907, top1: 0.52755, throughput: 311.99 | 2022-04-03 07:55:11.863 [rank:5] [train], epoch: 10/50, iter: 100/834, loss: 0.36459, lr: 1.385907, top1: 0.53312, throughput: 312.04 | 2022-04-03 07:55:11.864 [rank:2] [train], epoch: 10/50, iter: 100/834, loss: 0.36195, lr: 1.385907, top1: 0.53750, throughput: 311.83 | 2022-04-03 07:55:11.865 [rank:2] [train], epoch: 10/50, iter: 200/834, loss: 0.36533, lr: 1.382453, top1: 0.52891, throughput: 315.28 | 2022-04-03 07:56:12.764 [rank:3] [train], epoch: 10/50, iter: 200/834, loss: 0.37010, lr: 1.382453, top1: 0.52271, throughput: 314.90 | 2022-04-03 07:56:12.784 [rank:1] [train], epoch: 10/50, iter: 200/834, loss: 0.36436, lr: 1.382453, top1: 0.53156, throughput: 315.15 | 2022-04-03 07:56:12.787 [rank:0] [train], epoch: 10/50, iter: 200/834, loss: 0.36616, lr: 1.382453, top1: 0.52802, throughput: 314.80 | 2022-04-03 07:56:12.792 [rank:5] [train], epoch: 10/50, iter: 200/834, loss: 0.36727, lr: 1.382453, top1: 0.52750, throughput: 315.05 | 2022-04-03 07:56:12.806 [rank:4] [train], epoch: 10/50, iter: 200/834, loss: 0.36448, lr: 1.382453, top1: 0.53010, throughput: 314.91 | 2022-04-03 07:56:12.822 [rank:6] [train], epoch: 10/50, iter: 200/834, loss: 0.36619, lr: 1.382453, top1: 0.53339, throughput: 314.73 | 2022-04-03 07:56:12.839 [rank:7] [train], epoch: 10/50, iter: 200/834, loss: 0.36634, lr: 1.382453, top1: 0.52932, throughput: 315.32 | 2022-04-03 07:56:12.741 [rank:0] [train], epoch: 10/50, iter: 300/834, loss: 0.36863, lr: 1.378965, top1: 0.52089, throughput: 314.09 | 2022-04-03 07:57:13.920 [rank:5] [train], epoch: 10/50, iter: 300/834, loss: 0.36695, lr: 1.378965, top1: 0.52792, throughput: 314.14 | 2022-04-03 07:57:13.925 [rank:1] [train], epoch: 10/50, iter: 300/834, loss: 0.36763, lr: 1.378965, top1: 0.52938, throughput: 313.91 | 2022-04-03 07:57:13.950 [rank:6] [train], epoch: 10/50, iter: 300/834, loss: 0.36317, lr: 1.378965, top1: 0.53536, throughput: 314.18 | 2022-04-03 07:57:13.951 [rank:2] [train], epoch: 10/50, iter: 300/834, loss: 0.36649, lr: 1.378965, top1: 0.53286, throughput: 313.79 | 2022-04-03 07:57:13.951 [rank:7] [train], epoch: 10/50, iter: 300/834, loss: 0.36577, lr: 1.378965, top1: 0.53443, throughput: 313.61 | 2022-04-03 07:57:13.963 [rank:3] [train], epoch: 10/50, iter: 300/834, loss: 0.36223, lr: 1.378965, top1: 0.53562, throughput: 313.79 | 2022-04-03 07:57:13.971 [rank:4] [train], epoch: 10/50, iter: 300/834, loss: 0.36415, lr: 1.378965, top1: 0.53469, throughput: 314.28 | 2022-04-03 07:57:13.914 [rank:2] [train], epoch: 10/50, iter: 400/834, loss: 0.36758, lr: 1.375441, top1: 0.52510, throughput: 313.35 | 2022-04-03 07:58:15.225 [rank:7] [train], epoch: 10/50, iter: 400/834, loss: 0.36515, lr: 1.375441, top1: 0.52880, throughput: 313.36 | 2022-04-03 07:58:15.234 [rank:1] [train], epoch: 10/50, iter: 400/834, loss: 0.36500, lr: 1.375441, top1: 0.52938, throughput: 313.26 | 2022-04-03 07:58:15.241 [rank:6] [train], epoch: 10/50, iter: 400/834, loss: 0.36526, lr: 1.375441, top1: 0.53469, throughput: 313.22 | 2022-04-03 07:58:15.250 [rank:5] [train], epoch: 10/50, iter: 400/834, loss: 0.36905, lr: 1.375441, top1: 0.52573, throughput: 313.02 | 2022-04-03 07:58:15.262 [rank:4] [train], epoch: 10/50, iter: 400/834, loss: 0.36832, lr: 1.375441, top1: 0.52641, throughput: 312.92 | 2022-04-03 07:58:15.272 [rank:3] [train], epoch: 10/50, iter: 400/834, loss: 0.36544, lr: 1.375441, top1: 0.52969, throughput: 313.20 | 2022-04-03 07:58:15.275 [rank:0] [train], epoch: 10/50, iter: 400/834, loss: 0.36583, lr: 1.375441, top1: 0.53073, throughput: 312.88 | 2022-04-03 07:58:15.285 [rank:0] [train], epoch: 10/50, iter: 500/834, loss: 0.36757, lr: 1.371884, top1: 0.52937, throughput: 312.25 | 2022-04-03 07:59:16.773 [rank:7] [train], epoch: 10/50, iter: 500/834, loss: 0.36861, lr: 1.371884, top1: 0.52344, throughput: 311.99 | 2022-04-03 07:59:16.775 [rank:2] [train], epoch: 10/50, iter: 500/834, loss: 0.36751, lr: 1.371884, top1: 0.52641, throughput: 311.89 | 2022-04-03 07:59:16.784 [rank:4] [train], epoch: 10/50, iter: 500/834, loss: 0.36898, lr: 1.371884, top1: 0.51932, throughput: 312.07 | 2022-04-03 07:59:16.796 [rank:5] [train], epoch: 10/50, iter: 500/834, loss: 0.36778, lr: 1.371884, top1: 0.52995, throughput: 312.00 | 2022-04-03 07:59:16.800 [rank:1] [train], epoch: 10/50, iter: 500/834, loss: 0.36472, lr: 1.371884, top1: 0.52906, throughput: 311.80 | 2022-04-03 07:59:16.820 [rank:3] [train], epoch: 10/50, iter: 500/834, loss: 0.36880, lr: 1.371884, top1: 0.52380, throughput: 311.91 | 2022-04-03 07:59:16.832 [rank:6] [train], epoch: 10/50, iter: 500/834, loss: 0.36777, lr: 1.371884, top1: 0.52568, throughput: 312.17 | 2022-04-03 07:59:16.754 [rank:5] [train], epoch: 10/50, iter: 600/834, loss: 0.36646, lr: 1.368292, top1: 0.53021, throughput: 312.74 | 2022-04-03 08:00:18.194 [rank:7] [train], epoch: 10/50, iter: 600/834, loss: 0.36752, lr: 1.368292, top1: 0.52891, throughput: 312.55 | 2022-04-03 08:00:18.206 [rank:4] [train], epoch: 10/50, iter: 600/834, loss: 0.36678, lr: 1.368292, top1: 0.52682, throughput: 312.47 | 2022-04-03 08:00:18.243 [rank:6] [train], epoch: 10/50, iter: 600/834, loss: 0.36688, lr: 1.368292, top1: 0.53135, throughput: 312.23 | 2022-04-03 08:00:18.248 [rank:0] [train], epoch: 10/50, iter: 600/834, loss: 0.36715, lr: 1.368292, top1: 0.52406, throughput: 312.30 | 2022-04-03 08:00:18.252 [rank:2] [train], epoch: 10/50, iter: 600/834, loss: 0.36792, lr: 1.368292, top1: 0.52406, throughput: 312.32 | 2022-04-03 08:00:18.260 [rank:3] [train], epoch: 10/50, iter: 600/834, loss: 0.36406, lr: 1.368292, top1: 0.53396, throughput: 312.56 | 2022-04-03 08:00:18.260 [rank:1] [train], epoch: 10/50, iter: 600/834, loss: 0.36653, lr: 1.368292, top1: 0.52495, throughput: 312.81 | 2022-04-03 08:00:18.199 [rank:1] [train], epoch: 10/50, iter: 700/834, loss: 0.36573, lr: 1.364666, top1: 0.52964, throughput: 313.46 | 2022-04-03 08:01:19.450 [rank:7] [train], epoch: 10/50, iter: 700/834, loss: 0.37035, lr: 1.364666, top1: 0.52734, throughput: 313.45 | 2022-04-03 08:01:19.459 [rank:5] [train], epoch: 10/50, iter: 700/834, loss: 0.36606, lr: 1.364666, top1: 0.52849, throughput: 313.36 | 2022-04-03 08:01:19.465 [rank:6] [train], epoch: 10/50, iter: 700/834, loss: 0.37014, lr: 1.364666, top1: 0.51938, throughput: 313.58 | 2022-04-03 08:01:19.475 [rank:2] [train], epoch: 10/50, iter: 700/834, loss: 0.36601, lr: 1.364666, top1: 0.52792, throughput: 313.63 | 2022-04-03 08:01:19.478 [rank:4] [train], epoch: 10/50, iter: 700/834, loss: 0.36945, lr: 1.364666, top1: 0.52500, throughput: 313.44 | 2022-04-03 08:01:19.500 [rank:3] [train], epoch: 10/50, iter: 700/834, loss: 0.36680, lr: 1.364666, top1: 0.52620, throughput: 313.52 | 2022-04-03 08:01:19.500 [rank:0] [train], epoch: 10/50, iter: 700/834, loss: 0.36811, lr: 1.364666, top1: 0.52307, throughput: 313.29 | 2022-04-03 08:01:19.536 [rank:3] [train], epoch: 10/50, iter: 800/834, loss: 0.36633, lr: 1.361006, top1: 0.52552, throughput: 312.32 | 2022-04-03 08:02:20.976 [rank:1] [train], epoch: 10/50, iter: 800/834, loss: 0.36553, lr: 1.361006, top1: 0.53318, throughput: 311.89 | 2022-04-03 08:02:21.010 [rank:7] [train], epoch: 10/50, iter: 800/834, loss: 0.36621, lr: 1.361006, top1: 0.52776, throughput: 311.92 | 2022-04-03 08:02:21.013 [rank:6] [train], epoch: 10/50, iter: 800/834, loss: 0.36568, lr: 1.361006, top1: 0.53193, throughput: 312.00 | 2022-04-03 08:02:21.013 [rank:0] [train], epoch: 10/50, iter: 800/834, loss: 0.36711, lr: 1.361006, top1: 0.52786, throughput: 312.20 | 2022-04-03 08:02:21.034 [rank:4] [train], epoch: 10/50, iter: 800/834, loss: 0.36832, lr: 1.361006, top1: 0.52594, throughput: 311.88 | 2022-04-03 08:02:21.062 [rank:2] [train], epoch: 10/50, iter: 800/834, loss: 0.36734, lr: 1.361006, top1: 0.52557, throughput: 311.75 | 2022-04-03 08:02:21.066 [rank:5] [train], epoch: 10/50, iter: 800/834, loss: 0.36368, lr: 1.361006, top1: 0.53401, throughput: 311.60 | 2022-04-03 08:02:21.082 [rank:6] [train], epoch: 10/50, iter: 834/834, loss: 0.36596, lr: 1.359754, top1: 0.52374, throughput: 311.38 | 2022-04-03 08:02:41.978 [rank:1] [train], epoch: 10/50, iter: 834/834, loss: 0.36331, lr: 1.359754, top1: 0.52834, throughput: 311.31 | 2022-04-03 08:02:41.980 [rank:7] [train], epoch: 10/50, iter: 834/834, loss: 0.36491, lr: 1.359754, top1: 0.53018, throughput: 311.34 | 2022-04-03 08:02:41.981 [rank:4] [train], epoch: 10/50, iter: 834/834, loss: 0.36651, lr: 1.359754, top1: 0.52834, throughput: 312.04 | 2022-04-03 08:02:41.982 [rank:2] [train], epoch: 10/50, iter: 834/834, loss: 0.36248, lr: 1.359754, top1: 0.52497, throughput: 311.88 | 2022-04-03 08:02:41.997 [rank:3] [train], epoch: 10/50, iter: 834/834, loss: 0.36386, lr: 1.359754, top1: 0.53309, throughput: 310.51 | 2022-04-03 08:02:41.999 [rank:5] [train], epoch: 10/50, iter: 834/834, loss: 0.36725, lr: 1.359754, top1: 0.52558, throughput: 311.66 | 2022-04-03 08:02:42.028 [rank:0] [train], epoch: 10/50, iter: 834/834, loss: 0.36367, lr: 1.359754, top1: 0.53784, throughput: 310.61 | 2022-04-03 08:02:42.051 [rank:0] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.53920, throughput: 486.42 | 2022-04-03 08:02:54.900 [rank:7] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.53232, throughput: 483.48 | 2022-04-03 08:02:54.908 [rank:6] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.53488, throughput: 483.16 | 2022-04-03 08:02:54.914 [rank:4] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.53600, throughput: 483.28 | 2022-04-03 08:02:54.914 [rank:5] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.52928, throughput: 484.99 | 2022-04-03 08:02:54.915 [rank:2] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.54096, throughput: 483.61 | 2022-04-03 08:02:54.921 [rank:1] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.54688, throughput: 481.83 | 2022-04-03 08:02:54.951 [rank:3] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.52640, throughput: 482.54 | 2022-04-03 08:02:54.951 [rank:7] [train], epoch: 11/50, iter: 100/834, loss: 0.36031, lr: 1.356049, top1: 0.54260, throughput: 311.85 | 2022-04-03 08:03:56.477 [rank:5] [train], epoch: 11/50, iter: 100/834, loss: 0.36233, lr: 1.356049, top1: 0.53526, throughput: 311.86 | 2022-04-03 08:03:56.481 [rank:0] [train], epoch: 11/50, iter: 100/834, loss: 0.35814, lr: 1.356049, top1: 0.54859, throughput: 311.72 | 2022-04-03 08:03:56.494 [rank:6] [train], epoch: 11/50, iter: 100/834, loss: 0.35943, lr: 1.356049, top1: 0.54089, throughput: 311.76 | 2022-04-03 08:03:56.501 [rank:1] [train], epoch: 11/50, iter: 100/834, loss: 0.36229, lr: 1.356049, top1: 0.53469, throughput: 311.87 | 2022-04-03 08:03:56.516 [rank:3] [train], epoch: 11/50, iter: 100/834, loss: 0.36391, lr: 1.356049, top1: 0.53557, throughput: 311.81 | 2022-04-03 08:03:56.527 [rank:2] [train], epoch: 11/50, iter: 100/834, loss: 0.36253, lr: 1.356049, top1: 0.53891, throughput: 311.62 | 2022-04-03 08:03:56.535 [rank:4] [train], epoch: 11/50, iter: 100/834, loss: 0.35983, lr: 1.356049, top1: 0.53693, throughput: 311.56 | 2022-04-03 08:03:56.539 [rank:7] [train], epoch: 11/50, iter: 200/834, loss: 0.36042, lr: 1.352311, top1: 0.54115, throughput: 312.29 | 2022-04-03 08:04:57.958 [rank:6] [train], epoch: 11/50, iter: 200/834, loss: 0.36353, lr: 1.352311, top1: 0.53443, throughput: 312.33 | 2022-04-03 08:04:57.973 [rank:2] [train], epoch: 11/50, iter: 200/834, loss: 0.35432, lr: 1.352311, top1: 0.55068, throughput: 312.44 | 2022-04-03 08:04:57.987 [rank:5] [train], epoch: 11/50, iter: 200/834, loss: 0.36277, lr: 1.352311, top1: 0.53646, throughput: 312.13 | 2022-04-03 08:04:57.994 [rank:4] [train], epoch: 11/50, iter: 200/834, loss: 0.36365, lr: 1.352311, top1: 0.53427, throughput: 312.40 | 2022-04-03 08:04:57.999 [rank:3] [train], epoch: 11/50, iter: 200/834, loss: 0.36053, lr: 1.352311, top1: 0.54062, throughput: 312.33 | 2022-04-03 08:04:58.000 [rank:0] [train], epoch: 11/50, iter: 200/834, loss: 0.36025, lr: 1.352311, top1: 0.54057, throughput: 312.15 | 2022-04-03 08:04:58.004 [rank:1] [train], epoch: 11/50, iter: 200/834, loss: 0.35862, lr: 1.352311, top1: 0.54328, throughput: 312.03 | 2022-04-03 08:04:58.049 [rank:4] [train], epoch: 11/50, iter: 300/834, loss: 0.36192, lr: 1.348540, top1: 0.53958, throughput: 311.84 | 2022-04-03 08:05:59.568 [rank:2] [train], epoch: 11/50, iter: 300/834, loss: 0.36289, lr: 1.348540, top1: 0.53661, throughput: 311.68 | 2022-04-03 08:05:59.588 [rank:7] [train], epoch: 11/50, iter: 300/834, loss: 0.36274, lr: 1.348540, top1: 0.53932, throughput: 311.51 | 2022-04-03 08:05:59.593 [rank:5] [train], epoch: 11/50, iter: 300/834, loss: 0.35855, lr: 1.348540, top1: 0.53948, throughput: 311.49 | 2022-04-03 08:05:59.634 [rank:6] [train], epoch: 11/50, iter: 300/834, loss: 0.36133, lr: 1.348540, top1: 0.53937, throughput: 311.38 | 2022-04-03 08:05:59.635 [rank:0] [train], epoch: 11/50, iter: 300/834, loss: 0.36090, lr: 1.348540, top1: 0.53948, throughput: 311.49 | 2022-04-03 08:05:59.642 [rank:3] [train], epoch: 11/50, iter: 300/834, loss: 0.35961, lr: 1.348540, top1: 0.54109, throughput: 311.45 | 2022-04-03 08:05:59.647 [rank:1] [train], epoch: 11/50, iter: 300/834, loss: 0.36320, lr: 1.348540, top1: 0.53401, throughput: 311.55 | 2022-04-03 08:05:59.675 [rank:6] [train], epoch: 11/50, iter: 400/834, loss: 0.36244, lr: 1.344735, top1: 0.53016, throughput: 313.27 | 2022-04-03 08:07:00.923 [rank:7] [train], epoch: 11/50, iter: 400/834, loss: 0.36125, lr: 1.344735, top1: 0.53745, throughput: 313.02 | 2022-04-03 08:07:00.930 [rank:3] [train], epoch: 11/50, iter: 400/834, loss: 0.36405, lr: 1.344735, top1: 0.53484, throughput: 313.26 | 2022-04-03 08:07:00.937 [rank:1] [train], epoch: 11/50, iter: 400/834, loss: 0.36338, lr: 1.344735, top1: 0.53396, throughput: 313.38 | 2022-04-03 08:07:00.944 [rank:5] [train], epoch: 11/50, iter: 400/834, loss: 0.36034, lr: 1.344735, top1: 0.53844, throughput: 313.17 | 2022-04-03 08:07:00.944 [rank:4] [train], epoch: 11/50, iter: 400/834, loss: 0.36268, lr: 1.344735, top1: 0.53583, throughput: 312.72 | 2022-04-03 08:07:00.966 [rank:2] [train], epoch: 11/50, iter: 400/834, loss: 0.36325, lr: 1.344735, top1: 0.53229, throughput: 312.67 | 2022-04-03 08:07:00.995 [rank:0] [train], epoch: 11/50, iter: 400/834, loss: 0.35896, lr: 1.344735, top1: 0.53859, throughput: 312.94 | 2022-04-03 08:07:00.995 [rank:4] [train], epoch: 11/50, iter: 500/834, loss: 0.36337, lr: 1.340898, top1: 0.53547, throughput: 311.64 | 2022-04-03 08:08:02.575 [rank:3] [train], epoch: 11/50, iter: 500/834, loss: 0.36213, lr: 1.340898, top1: 0.53672, throughput: 311.44 | 2022-04-03 08:08:02.587 [rank:1] [train], epoch: 11/50, iter: 500/834, loss: 0.36009, lr: 1.340898, top1: 0.54385, throughput: 311.43 | 2022-04-03 08:08:02.594 [rank:2] [train], epoch: 11/50, iter: 500/834, loss: 0.36234, lr: 1.340898, top1: 0.52958, throughput: 311.57 | 2022-04-03 08:08:02.618 [rank:5] [train], epoch: 11/50, iter: 500/834, loss: 0.36077, lr: 1.340898, top1: 0.54339, throughput: 311.24 | 2022-04-03 08:08:02.632 [rank:6] [train], epoch: 11/50, iter: 500/834, loss: 0.36248, lr: 1.340898, top1: 0.53297, throughput: 311.11 | 2022-04-03 08:08:02.638 [rank:0] [train], epoch: 11/50, iter: 500/834, loss: 0.36230, lr: 1.340898, top1: 0.53828, throughput: 311.47 | 2022-04-03 08:08:02.639 [rank:7] [train], epoch: 11/50, iter: 500/834, loss: 0.35910, lr: 1.340898, top1: 0.54536, throughput: 311.49 | 2022-04-03 08:08:02.570 [rank:7] [train], epoch: 11/50, iter: 600/834, loss: 0.36032, lr: 1.337029, top1: 0.53755, throughput: 312.02 | 2022-04-03 08:09:04.104 [rank:6] [train], epoch: 11/50, iter: 600/834, loss: 0.36042, lr: 1.337029, top1: 0.54604, throughput: 312.37 | 2022-04-03 08:09:04.104 [rank:3] [train], epoch: 11/50, iter: 600/834, loss: 0.36122, lr: 1.337029, top1: 0.53469, throughput: 312.06 | 2022-04-03 08:09:04.114 [rank:2] [train], epoch: 11/50, iter: 600/834, loss: 0.35791, lr: 1.337029, top1: 0.54349, throughput: 312.10 | 2022-04-03 08:09:04.136 [rank:0] [train], epoch: 11/50, iter: 600/834, loss: 0.36031, lr: 1.337029, top1: 0.53594, throughput: 312.19 | 2022-04-03 08:09:04.141 [rank:4] [train], epoch: 11/50, iter: 600/834, loss: 0.36003, lr: 1.337029, top1: 0.53937, throughput: 311.81 | 2022-04-03 08:09:04.150 [rank:5] [train], epoch: 11/50, iter: 600/834, loss: 0.36058, lr: 1.337029, top1: 0.53604, throughput: 312.01 | 2022-04-03 08:09:04.169 [rank:1] [train], epoch: 11/50, iter: 600/834, loss: 0.36139, lr: 1.337029, top1: 0.54141, throughput: 311.72 | 2022-04-03 08:09:04.187 [rank:2] [train], epoch: 11/50, iter: 700/834, loss: 0.36168, lr: 1.333127, top1: 0.54094, throughput: 313.22 | 2022-04-03 08:10:05.435 [rank:7] [train], epoch: 11/50, iter: 700/834, loss: 0.36188, lr: 1.333127, top1: 0.53594, throughput: 312.93 | 2022-04-03 08:10:05.461 [rank:0] [train], epoch: 11/50, iter: 700/834, loss: 0.36189, lr: 1.333127, top1: 0.53771, throughput: 313.07 | 2022-04-03 08:10:05.469 [rank:4] [train], epoch: 11/50, iter: 700/834, loss: 0.36120, lr: 1.333127, top1: 0.54172, throughput: 313.08 | 2022-04-03 08:10:05.477 [rank:6] [train], epoch: 11/50, iter: 700/834, loss: 0.35608, lr: 1.333127, top1: 0.54380, throughput: 312.81 | 2022-04-03 08:10:05.483 [rank:5] [train], epoch: 11/50, iter: 700/834, loss: 0.36242, lr: 1.333127, top1: 0.53406, throughput: 313.14 | 2022-04-03 08:10:05.484 [rank:3] [train], epoch: 11/50, iter: 700/834, loss: 0.36125, lr: 1.333127, top1: 0.53469, throughput: 312.80 | 2022-04-03 08:10:05.495 [rank:1] [train], epoch: 11/50, iter: 700/834, loss: 0.36137, lr: 1.333127, top1: 0.53708, throughput: 312.84 | 2022-04-03 08:10:05.559 [rank:2] [train], epoch: 11/50, iter: 800/834, loss: 0.36467, lr: 1.329193, top1: 0.53333, throughput: 310.94 | 2022-04-03 08:11:07.184 [rank:6] [train], epoch: 11/50, iter: 800/834, loss: 0.36095, lr: 1.329193, top1: 0.54219, throughput: 310.88 | 2022-04-03 08:11:07.242 [rank:4] [train], epoch: 11/50, iter: 800/834, loss: 0.36084, lr: 1.329193, top1: 0.53464, throughput: 310.80 | 2022-04-03 08:11:07.253 [rank:1] [train], epoch: 11/50, iter: 800/834, loss: 0.36171, lr: 1.329193, top1: 0.53833, throughput: 311.12 | 2022-04-03 08:11:07.271 [rank:5] [train], epoch: 11/50, iter: 800/834, loss: 0.36297, lr: 1.329193, top1: 0.53130, throughput: 310.70 | 2022-04-03 08:11:07.280 [rank:3] [train], epoch: 11/50, iter: 800/834, loss: 0.36225, lr: 1.329193, top1: 0.53615, throughput: 310.73 | 2022-04-03 08:11:07.286 [rank:0] [train], epoch: 11/50, iter: 800/834, loss: 0.36244, lr: 1.329193, top1: 0.52807, throughput: 310.58 | 2022-04-03 08:11:07.289 [rank:7] [train], epoch: 11/50, iter: 800/834, loss: 0.36124, lr: 1.329193, top1: 0.54036, throughput: 310.91 | 2022-04-03 08:11:07.215 [rank:5] [train], epoch: 11/50, iter: 834/834, loss: 0.36212, lr: 1.327848, top1: 0.53922, throughput: 310.64 | 2022-04-03 08:11:28.294 [rank:3] [train], epoch: 11/50, iter: 834/834, loss: 0.36156, lr: 1.327848, top1: 0.53768, throughput: 310.59 | 2022-04-03 08:11:28.304 [rank:4] [train], epoch: 11/50, iter: 834/834, loss: 0.36020, lr: 1.327848, top1: 0.54550, throughput: 309.97 | 2022-04-03 08:11:28.313 [rank:6] [train], epoch: 11/50, iter: 834/834, loss: 0.36079, lr: 1.327848, top1: 0.53768, throughput: 309.80 | 2022-04-03 08:11:28.313 [rank:0] [train], epoch: 11/50, iter: 834/834, loss: 0.36064, lr: 1.327848, top1: 0.53830, throughput: 310.45 | 2022-04-03 08:11:28.316 [rank:1] [train], epoch: 11/50, iter: 834/834, loss: 0.35194, lr: 1.327848, top1: 0.55316, throughput: 310.13 | 2022-04-03 08:11:28.320 [rank:2] [train], epoch: 11/50, iter: 834/834, loss: 0.35867, lr: 1.327848, top1: 0.54841, throughput: 308.84 | 2022-04-03 08:11:28.321 [rank:7] [train], epoch: 11/50, iter: 834/834, loss: 0.36086, lr: 1.327848, top1: 0.53661, throughput: 308.81 | 2022-04-03 08:11:28.354 [rank:0] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.55056, throughput: 484.13 | 2022-04-03 08:11:41.226 [rank:4] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54480, throughput: 483.98 | 2022-04-03 08:11:41.227 [rank:5] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.53600, throughput: 483.18 | 2022-04-03 08:11:41.229 [rank:7] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54064, throughput: 485.29 | 2022-04-03 08:11:41.233 [rank:6] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54304, throughput: 483.60 | 2022-04-03 08:11:41.237 [rank:3] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54128, throughput: 483.05 | 2022-04-03 08:11:41.243 [rank:2] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.53760, throughput: 483.29 | 2022-04-03 08:11:41.253 [rank:1] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54656, throughput: 482.40 | 2022-04-03 08:11:41.276 [rank:2] [train], epoch: 12/50, iter: 100/834, loss: 0.35430, lr: 1.323871, top1: 0.55286, throughput: 312.33 | 2022-04-03 08:12:42.726 [rank:7] [train], epoch: 12/50, iter: 100/834, loss: 0.35522, lr: 1.323871, top1: 0.54885, throughput: 312.16 | 2022-04-03 08:12:42.739 [rank:0] [train], epoch: 12/50, iter: 100/834, loss: 0.35646, lr: 1.323871, top1: 0.54755, throughput: 312.08 | 2022-04-03 08:12:42.749 [rank:6] [train], epoch: 12/50, iter: 100/834, loss: 0.35656, lr: 1.323871, top1: 0.54490, throughput: 312.09 | 2022-04-03 08:12:42.758 [rank:3] [train], epoch: 12/50, iter: 100/834, loss: 0.35383, lr: 1.323871, top1: 0.55026, throughput: 312.08 | 2022-04-03 08:12:42.765 [rank:1] [train], epoch: 12/50, iter: 100/834, loss: 0.35288, lr: 1.323871, top1: 0.55391, throughput: 312.22 | 2022-04-03 08:12:42.771 [rank:5] [train], epoch: 12/50, iter: 100/834, loss: 0.35233, lr: 1.323871, top1: 0.55260, throughput: 312.36 | 2022-04-03 08:12:42.698 [rank:4] [train], epoch: 12/50, iter: 100/834, loss: 0.35706, lr: 1.323871, top1: 0.54328, throughput: 311.88 | 2022-04-03 08:12:42.789 [rank:0] [train], epoch: 12/50, iter: 200/834, loss: 0.35444, lr: 1.319863, top1: 0.55094, throughput: 312.27 | 2022-04-03 08:13:44.234 [rank:1] [train], epoch: 12/50, iter: 200/834, loss: 0.35597, lr: 1.319863, top1: 0.54495, throughput: 312.14 | 2022-04-03 08:13:44.281 [rank:4] [train], epoch: 12/50, iter: 200/834, loss: 0.35312, lr: 1.319863, top1: 0.55198, throughput: 312.11 | 2022-04-03 08:13:44.306 [rank:5] [train], epoch: 12/50, iter: 200/834, loss: 0.35911, lr: 1.319863, top1: 0.54323, throughput: 311.64 | 2022-04-03 08:13:44.308 [rank:2] [train], epoch: 12/50, iter: 200/834, loss: 0.35655, lr: 1.319863, top1: 0.54849, throughput: 311.78 | 2022-04-03 08:13:44.308 [rank:6] [train], epoch: 12/50, iter: 200/834, loss: 0.35674, lr: 1.319863, top1: 0.54505, throughput: 311.94 | 2022-04-03 08:13:44.309 [rank:7] [train], epoch: 12/50, iter: 200/834, loss: 0.35789, lr: 1.319863, top1: 0.54505, throughput: 311.82 | 2022-04-03 08:13:44.313 [rank:3] [train], epoch: 12/50, iter: 200/834, loss: 0.35740, lr: 1.319863, top1: 0.54740, throughput: 311.87 | 2022-04-03 08:13:44.329 [rank:3] [train], epoch: 12/50, iter: 300/834, loss: 0.35665, lr: 1.315824, top1: 0.55078, throughput: 311.07 | 2022-04-03 08:14:46.052 [rank:1] [train], epoch: 12/50, iter: 300/834, loss: 0.35778, lr: 1.315824, top1: 0.54781, throughput: 310.79 | 2022-04-03 08:14:46.058 [rank:5] [train], epoch: 12/50, iter: 300/834, loss: 0.35556, lr: 1.315824, top1: 0.55026, throughput: 310.89 | 2022-04-03 08:14:46.066 [rank:7] [train], epoch: 12/50, iter: 300/834, loss: 0.35793, lr: 1.315824, top1: 0.54500, throughput: 310.83 | 2022-04-03 08:14:46.084 [rank:4] [train], epoch: 12/50, iter: 300/834, loss: 0.36062, lr: 1.315824, top1: 0.53495, throughput: 310.64 | 2022-04-03 08:14:46.114 [rank:2] [train], epoch: 12/50, iter: 300/834, loss: 0.35865, lr: 1.315824, top1: 0.54068, throughput: 310.99 | 2022-04-03 08:14:46.046 [rank:0] [train], epoch: 12/50, iter: 300/834, loss: 0.35528, lr: 1.315824, top1: 0.55130, throughput: 310.14 | 2022-04-03 08:14:46.141 [rank:6] [train], epoch: 12/50, iter: 300/834, loss: 0.35705, lr: 1.315824, top1: 0.54312, throughput: 310.92 | 2022-04-03 08:14:46.061 [rank:3] [train], epoch: 12/50, iter: 400/834, loss: 0.35585, lr: 1.311753, top1: 0.54760, throughput: 314.48 | 2022-04-03 08:15:47.105 [rank:1] [train], epoch: 12/50, iter: 400/834, loss: 0.35437, lr: 1.311753, top1: 0.54906, throughput: 314.48 | 2022-04-03 08:15:47.111 [rank:7] [train], epoch: 12/50, iter: 400/834, loss: 0.35740, lr: 1.311753, top1: 0.54510, throughput: 314.60 | 2022-04-03 08:15:47.114 [rank:2] [train], epoch: 12/50, iter: 400/834, loss: 0.35971, lr: 1.311753, top1: 0.54109, throughput: 314.32 | 2022-04-03 08:15:47.130 [rank:4] [train], epoch: 12/50, iter: 400/834, loss: 0.35524, lr: 1.311753, top1: 0.54990, throughput: 314.52 | 2022-04-03 08:15:47.159 [rank:0] [train], epoch: 12/50, iter: 400/834, loss: 0.35520, lr: 1.311753, top1: 0.54427, throughput: 314.61 | 2022-04-03 08:15:47.169 [rank:5] [train], epoch: 12/50, iter: 400/834, loss: 0.35379, lr: 1.311753, top1: 0.54776, throughput: 314.20 | 2022-04-03 08:15:47.174 [rank:6] [train], epoch: 12/50, iter: 400/834, loss: 0.35578, lr: 1.311753, top1: 0.54812, throughput: 314.09 | 2022-04-03 08:15:47.190 [rank:7] [train], epoch: 12/50, iter: 500/834, loss: 0.35706, lr: 1.307652, top1: 0.54495, throughput: 312.98 | 2022-04-03 08:16:48.460 [rank:3] [train], epoch: 12/50, iter: 500/834, loss: 0.35864, lr: 1.307652, top1: 0.54177, throughput: 312.93 | 2022-04-03 08:16:48.460 [rank:5] [train], epoch: 12/50, iter: 500/834, loss: 0.35501, lr: 1.307652, top1: 0.54807, throughput: 313.23 | 2022-04-03 08:16:48.471 [rank:0] [train], epoch: 12/50, iter: 500/834, loss: 0.35836, lr: 1.307652, top1: 0.54688, throughput: 313.15 | 2022-04-03 08:16:48.482 [rank:6] [train], epoch: 12/50, iter: 500/834, loss: 0.35835, lr: 1.307652, top1: 0.54245, throughput: 313.07 | 2022-04-03 08:16:48.518 [rank:4] [train], epoch: 12/50, iter: 500/834, loss: 0.35594, lr: 1.307652, top1: 0.54849, throughput: 313.29 | 2022-04-03 08:16:48.444 [rank:2] [train], epoch: 12/50, iter: 500/834, loss: 0.35539, lr: 1.307652, top1: 0.54620, throughput: 312.68 | 2022-04-03 08:16:48.534 [rank:1] [train], epoch: 12/50, iter: 500/834, loss: 0.35736, lr: 1.307652, top1: 0.54552, throughput: 312.51 | 2022-04-03 08:16:48.549 [rank:3] [train], epoch: 12/50, iter: 600/834, loss: 0.35665, lr: 1.303520, top1: 0.54339, throughput: 313.54 | 2022-04-03 08:17:49.696 [rank:6] [train], epoch: 12/50, iter: 600/834, loss: 0.35663, lr: 1.303520, top1: 0.54458, throughput: 313.70 | 2022-04-03 08:17:49.724 [rank:7] [train], epoch: 12/50, iter: 600/834, loss: 0.35609, lr: 1.303520, top1: 0.54833, throughput: 313.39 | 2022-04-03 08:17:49.726 [rank:2] [train], epoch: 12/50, iter: 600/834, loss: 0.35722, lr: 1.303520, top1: 0.54750, throughput: 313.76 | 2022-04-03 08:17:49.728 [rank:1] [train], epoch: 12/50, iter: 600/834, loss: 0.35768, lr: 1.303520, top1: 0.54620, throughput: 313.82 | 2022-04-03 08:17:49.731 [rank:4] [train], epoch: 12/50, iter: 600/834, loss: 0.35745, lr: 1.303520, top1: 0.54615, throughput: 313.26 | 2022-04-03 08:17:49.735 [rank:0] [train], epoch: 12/50, iter: 600/834, loss: 0.35773, lr: 1.303520, top1: 0.54432, throughput: 313.45 | 2022-04-03 08:17:49.735 [rank:5] [train], epoch: 12/50, iter: 600/834, loss: 0.36180, lr: 1.303520, top1: 0.53740, throughput: 313.62 | 2022-04-03 08:17:49.692 [rank:3] [train], epoch: 12/50, iter: 700/834, loss: 0.35713, lr: 1.299357, top1: 0.54839, throughput: 313.18 | 2022-04-03 08:18:51.003 [rank:4] [train], epoch: 12/50, iter: 700/834, loss: 0.36074, lr: 1.299357, top1: 0.53698, throughput: 313.37 | 2022-04-03 08:18:51.004 [rank:7] [train], epoch: 12/50, iter: 700/834, loss: 0.35623, lr: 1.299357, top1: 0.54896, throughput: 313.14 | 2022-04-03 08:18:51.040 [rank:6] [train], epoch: 12/50, iter: 700/834, loss: 0.35957, lr: 1.299357, top1: 0.53807, throughput: 313.12 | 2022-04-03 08:18:51.042 [rank:5] [train], epoch: 12/50, iter: 700/834, loss: 0.35892, lr: 1.299357, top1: 0.54198, throughput: 312.95 | 2022-04-03 08:18:51.044 [rank:2] [train], epoch: 12/50, iter: 700/834, loss: 0.35839, lr: 1.299357, top1: 0.54115, throughput: 313.13 | 2022-04-03 08:18:51.044 [rank:0] [train], epoch: 12/50, iter: 700/834, loss: 0.35621, lr: 1.299357, top1: 0.54589, throughput: 313.12 | 2022-04-03 08:18:51.053 [rank:1] [train], epoch: 12/50, iter: 700/834, loss: 0.35479, lr: 1.299357, top1: 0.55109, throughput: 313.44 | 2022-04-03 08:18:50.986 [rank:0] [train], epoch: 12/50, iter: 800/834, loss: 0.35824, lr: 1.295164, top1: 0.54422, throughput: 312.10 | 2022-04-03 08:19:52.572 [rank:7] [train], epoch: 12/50, iter: 800/834, loss: 0.35864, lr: 1.295164, top1: 0.54141, throughput: 312.01 | 2022-04-03 08:19:52.576 [rank:3] [train], epoch: 12/50, iter: 800/834, loss: 0.35931, lr: 1.295164, top1: 0.53766, throughput: 311.70 | 2022-04-03 08:19:52.601 [rank:2] [train], epoch: 12/50, iter: 800/834, loss: 0.35531, lr: 1.295164, top1: 0.54854, throughput: 311.90 | 2022-04-03 08:19:52.602 [rank:6] [train], epoch: 12/50, iter: 800/834, loss: 0.35974, lr: 1.295164, top1: 0.54057, throughput: 311.87 | 2022-04-03 08:19:52.606 [rank:1] [train], epoch: 12/50, iter: 800/834, loss: 0.35698, lr: 1.295164, top1: 0.54844, throughput: 311.48 | 2022-04-03 08:19:52.627 [rank:5] [train], epoch: 12/50, iter: 800/834, loss: 0.35476, lr: 1.295164, top1: 0.54911, throughput: 311.73 | 2022-04-03 08:19:52.635 [rank:4] [train], epoch: 12/50, iter: 800/834, loss: 0.35501, lr: 1.295164, top1: 0.54885, throughput: 311.47 | 2022-04-03 08:19:52.647 [rank:6] [train], epoch: 12/50, iter: 834/834, loss: 0.35998, lr: 1.293732, top1: 0.54534, throughput: 312.49 | 2022-04-03 08:20:13.496 [rank:3] [train], epoch: 12/50, iter: 834/834, loss: 0.35569, lr: 1.293732, top1: 0.54182, throughput: 312.39 | 2022-04-03 08:20:13.497 [rank:7] [train], epoch: 12/50, iter: 834/834, loss: 0.35897, lr: 1.293732, top1: 0.54121, throughput: 311.94 | 2022-04-03 08:20:13.504 [rank:5] [train], epoch: 12/50, iter: 834/834, loss: 0.35698, lr: 1.293732, top1: 0.53814, throughput: 312.79 | 2022-04-03 08:20:13.506 [rank:1] [train], epoch: 12/50, iter: 834/834, loss: 0.35841, lr: 1.293732, top1: 0.53998, throughput: 312.64 | 2022-04-03 08:20:13.507 [rank:2] [train], epoch: 12/50, iter: 834/834, loss: 0.36193, lr: 1.293732, top1: 0.52574, throughput: 312.15 | 2022-04-03 08:20:13.515 [rank:0] [train], epoch: 12/50, iter: 834/834, loss: 0.35972, lr: 1.293732, top1: 0.54550, throughput: 311.69 | 2022-04-03 08:20:13.516 [rank:4] [train], epoch: 12/50, iter: 834/834, loss: 0.35853, lr: 1.293732, top1: 0.54534, throughput: 312.23 | 2022-04-03 08:20:13.555 [rank:0] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.53312, throughput: 487.43 | 2022-04-03 08:20:26.338 [rank:4] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.52720, throughput: 488.86 | 2022-04-03 08:20:26.340 [rank:5] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.51808, throughput: 486.53 | 2022-04-03 08:20:26.352 [rank:7] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.53008, throughput: 486.36 | 2022-04-03 08:20:26.354 [rank:6] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.52560, throughput: 485.52 | 2022-04-03 08:20:26.369 [rank:3] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.52048, throughput: 485.44 | 2022-04-03 08:20:26.372 [rank:2] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.51936, throughput: 486.09 | 2022-04-03 08:20:26.372 [rank:1] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.53184, throughput: 485.29 | 2022-04-03 08:20:26.386 [rank:0] [train], epoch: 13/50, iter: 100/834, loss: 0.35406, lr: 1.289500, top1: 0.55057, throughput: 313.98 | 2022-04-03 08:21:27.490 [rank:1] [train], epoch: 13/50, iter: 100/834, loss: 0.34959, lr: 1.289500, top1: 0.55953, throughput: 314.11 | 2022-04-03 08:21:27.512 [rank:6] [train], epoch: 13/50, iter: 100/834, loss: 0.35205, lr: 1.289500, top1: 0.55333, throughput: 314.01 | 2022-04-03 08:21:27.514 [rank:5] [train], epoch: 13/50, iter: 100/834, loss: 0.35312, lr: 1.289500, top1: 0.56016, throughput: 313.90 | 2022-04-03 08:21:27.518 [rank:4] [train], epoch: 13/50, iter: 100/834, loss: 0.34859, lr: 1.289500, top1: 0.56120, throughput: 313.83 | 2022-04-03 08:21:27.519 [rank:2] [train], epoch: 13/50, iter: 100/834, loss: 0.35228, lr: 1.289500, top1: 0.55677, throughput: 313.96 | 2022-04-03 08:21:27.526 [rank:7] [train], epoch: 13/50, iter: 100/834, loss: 0.34833, lr: 1.289500, top1: 0.55979, throughput: 313.76 | 2022-04-03 08:21:27.547 [rank:3] [train], epoch: 13/50, iter: 100/834, loss: 0.34996, lr: 1.289500, top1: 0.55906, throughput: 314.27 | 2022-04-03 08:21:27.466 [rank:7] [train], epoch: 13/50, iter: 200/834, loss: 0.35033, lr: 1.285237, top1: 0.55635, throughput: 312.07 | 2022-04-03 08:22:29.071 [rank:4] [train], epoch: 13/50, iter: 200/834, loss: 0.35115, lr: 1.285237, top1: 0.55568, throughput: 311.93 | 2022-04-03 08:22:29.071 [rank:0] [train], epoch: 13/50, iter: 200/834, loss: 0.35343, lr: 1.285237, top1: 0.55052, throughput: 311.77 | 2022-04-03 08:22:29.073 [rank:3] [train], epoch: 13/50, iter: 200/834, loss: 0.35481, lr: 1.285237, top1: 0.54703, throughput: 311.64 | 2022-04-03 08:22:29.075 [rank:5] [train], epoch: 13/50, iter: 200/834, loss: 0.35092, lr: 1.285237, top1: 0.55516, throughput: 311.88 | 2022-04-03 08:22:29.080 [rank:1] [train], epoch: 13/50, iter: 200/834, loss: 0.35108, lr: 1.285237, top1: 0.55656, throughput: 311.84 | 2022-04-03 08:22:29.082 [rank:2] [train], epoch: 13/50, iter: 200/834, loss: 0.35043, lr: 1.285237, top1: 0.55583, throughput: 311.88 | 2022-04-03 08:22:29.089 [rank:6] [train], epoch: 13/50, iter: 200/834, loss: 0.35148, lr: 1.285237, top1: 0.55479, throughput: 312.18 | 2022-04-03 08:22:29.016 [rank:5] [train], epoch: 13/50, iter: 300/834, loss: 0.35203, lr: 1.280946, top1: 0.55641, throughput: 314.87 | 2022-04-03 08:23:30.057 [rank:4] [train], epoch: 13/50, iter: 300/834, loss: 0.35290, lr: 1.280946, top1: 0.55448, throughput: 314.78 | 2022-04-03 08:23:30.066 [rank:6] [train], epoch: 13/50, iter: 300/834, loss: 0.35399, lr: 1.280946, top1: 0.55271, throughput: 314.49 | 2022-04-03 08:23:30.068 [rank:0] [train], epoch: 13/50, iter: 300/834, loss: 0.35453, lr: 1.280946, top1: 0.54885, throughput: 314.72 | 2022-04-03 08:23:30.079 [rank:7] [train], epoch: 13/50, iter: 300/834, loss: 0.35262, lr: 1.280946, top1: 0.55385, throughput: 314.60 | 2022-04-03 08:23:30.100 [rank:3] [train], epoch: 13/50, iter: 300/834, loss: 0.35473, lr: 1.280946, top1: 0.55120, throughput: 314.59 | 2022-04-03 08:23:30.107 [rank:2] [train], epoch: 13/50, iter: 300/834, loss: 0.35373, lr: 1.280946, top1: 0.55156, throughput: 314.61 | 2022-04-03 08:23:30.117 [rank:1] [train], epoch: 13/50, iter: 300/834, loss: 0.35605, lr: 1.280946, top1: 0.54583, throughput: 314.37 | 2022-04-03 08:23:30.157 [rank:2] [train], epoch: 13/50, iter: 400/834, loss: 0.35299, lr: 1.276625, top1: 0.55089, throughput: 314.84 | 2022-04-03 08:24:31.099 [rank:0] [train], epoch: 13/50, iter: 400/834, loss: 0.35218, lr: 1.276625, top1: 0.55693, throughput: 314.64 | 2022-04-03 08:24:31.102 [rank:4] [train], epoch: 13/50, iter: 400/834, loss: 0.35534, lr: 1.276625, top1: 0.54630, throughput: 314.50 | 2022-04-03 08:24:31.116 [rank:5] [train], epoch: 13/50, iter: 400/834, loss: 0.35149, lr: 1.276625, top1: 0.55708, throughput: 314.37 | 2022-04-03 08:24:31.132 [rank:7] [train], epoch: 13/50, iter: 400/834, loss: 0.35326, lr: 1.276625, top1: 0.55318, throughput: 314.58 | 2022-04-03 08:24:31.134 [rank:6] [train], epoch: 13/50, iter: 400/834, loss: 0.35457, lr: 1.276625, top1: 0.55182, throughput: 314.33 | 2022-04-03 08:24:31.150 [rank:3] [train], epoch: 13/50, iter: 400/834, loss: 0.35345, lr: 1.276625, top1: 0.55609, throughput: 314.52 | 2022-04-03 08:24:31.152 [rank:1] [train], epoch: 13/50, iter: 400/834, loss: 0.35082, lr: 1.276625, top1: 0.55776, throughput: 314.63 | 2022-04-03 08:24:31.181 [rank:2] [train], epoch: 13/50, iter: 500/834, loss: 0.35056, lr: 1.272275, top1: 0.55328, throughput: 313.37 | 2022-04-03 08:25:32.368 [rank:4] [train], epoch: 13/50, iter: 500/834, loss: 0.35115, lr: 1.272275, top1: 0.55182, throughput: 313.45 | 2022-04-03 08:25:32.370 [rank:7] [train], epoch: 13/50, iter: 500/834, loss: 0.35244, lr: 1.272275, top1: 0.54969, throughput: 313.39 | 2022-04-03 08:25:32.399 [rank:5] [train], epoch: 13/50, iter: 500/834, loss: 0.35332, lr: 1.272275, top1: 0.55443, throughput: 313.35 | 2022-04-03 08:25:32.405 [rank:6] [train], epoch: 13/50, iter: 500/834, loss: 0.35155, lr: 1.272275, top1: 0.55344, throughput: 313.43 | 2022-04-03 08:25:32.407 [rank:3] [train], epoch: 13/50, iter: 500/834, loss: 0.35229, lr: 1.272275, top1: 0.55047, throughput: 313.44 | 2022-04-03 08:25:32.408 [rank:0] [train], epoch: 13/50, iter: 500/834, loss: 0.35433, lr: 1.272275, top1: 0.55203, throughput: 313.13 | 2022-04-03 08:25:32.419 [rank:1] [train], epoch: 13/50, iter: 500/834, loss: 0.35254, lr: 1.272275, top1: 0.55563, throughput: 313.44 | 2022-04-03 08:25:32.437 [rank:0] [train], epoch: 13/50, iter: 600/834, loss: 0.35155, lr: 1.267897, top1: 0.55203, throughput: 312.62 | 2022-04-03 08:26:33.835 [rank:7] [train], epoch: 13/50, iter: 600/834, loss: 0.35332, lr: 1.267897, top1: 0.55099, throughput: 312.35 | 2022-04-03 08:26:33.869 [rank:5] [train], epoch: 13/50, iter: 600/834, loss: 0.35137, lr: 1.267897, top1: 0.55490, throughput: 312.29 | 2022-04-03 08:26:33.886 [rank:3] [train], epoch: 13/50, iter: 600/834, loss: 0.35341, lr: 1.267897, top1: 0.55177, throughput: 312.18 | 2022-04-03 08:26:33.911 [rank:1] [train], epoch: 13/50, iter: 600/834, loss: 0.35284, lr: 1.267897, top1: 0.55443, throughput: 312.76 | 2022-04-03 08:26:33.826 [rank:4] [train], epoch: 13/50, iter: 600/834, loss: 0.35168, lr: 1.267897, top1: 0.55109, throughput: 311.98 | 2022-04-03 08:26:33.912 [rank:6] [train], epoch: 13/50, iter: 600/834, loss: 0.35535, lr: 1.267897, top1: 0.54911, throughput: 312.12 | 2022-04-03 08:26:33.922 [rank:2] [train], epoch: 13/50, iter: 600/834, loss: 0.34994, lr: 1.267897, top1: 0.56172, throughput: 311.86 | 2022-04-03 08:26:33.934 [rank:1] [train], epoch: 13/50, iter: 700/834, loss: 0.35193, lr: 1.263491, top1: 0.55573, throughput: 309.65 | 2022-04-03 08:27:35.832 [rank:5] [train], epoch: 13/50, iter: 700/834, loss: 0.35217, lr: 1.263491, top1: 0.55458, throughput: 309.89 | 2022-04-03 08:27:35.843 [rank:3] [train], epoch: 13/50, iter: 700/834, loss: 0.35532, lr: 1.263491, top1: 0.55005, throughput: 309.99 | 2022-04-03 08:27:35.849 [rank:7] [train], epoch: 13/50, iter: 700/834, loss: 0.35543, lr: 1.263491, top1: 0.54901, throughput: 309.72 | 2022-04-03 08:27:35.861 [rank:0] [train], epoch: 13/50, iter: 700/834, loss: 0.35311, lr: 1.263491, top1: 0.55349, throughput: 309.44 | 2022-04-03 08:27:35.882 [rank:2] [train], epoch: 13/50, iter: 700/834, loss: 0.35385, lr: 1.263491, top1: 0.55224, throughput: 309.91 | 2022-04-03 08:27:35.887 [rank:6] [train], epoch: 13/50, iter: 700/834, loss: 0.35304, lr: 1.263491, top1: 0.55266, throughput: 309.75 | 2022-04-03 08:27:35.907 [rank:4] [train], epoch: 13/50, iter: 700/834, loss: 0.35345, lr: 1.263491, top1: 0.55464, throughput: 309.59 | 2022-04-03 08:27:35.930 [rank:2] [train], epoch: 13/50, iter: 800/834, loss: 0.35265, lr: 1.259056, top1: 0.55536, throughput: 313.05 | 2022-04-03 08:28:37.219 [rank:7] [train], epoch: 13/50, iter: 800/834, loss: 0.35154, lr: 1.259056, top1: 0.55521, throughput: 312.84 | 2022-04-03 08:28:37.233 [rank:1] [train], epoch: 13/50, iter: 800/834, loss: 0.35288, lr: 1.259056, top1: 0.55036, throughput: 312.67 | 2022-04-03 08:28:37.239 [rank:3] [train], epoch: 13/50, iter: 800/834, loss: 0.35322, lr: 1.259056, top1: 0.55182, throughput: 312.70 | 2022-04-03 08:28:37.250 [rank:0] [train], epoch: 13/50, iter: 800/834, loss: 0.35550, lr: 1.259056, top1: 0.54708, throughput: 312.73 | 2022-04-03 08:28:37.276 [rank:4] [train], epoch: 13/50, iter: 800/834, loss: 0.35410, lr: 1.259056, top1: 0.55167, throughput: 312.93 | 2022-04-03 08:28:37.285 [rank:6] [train], epoch: 13/50, iter: 800/834, loss: 0.35179, lr: 1.259056, top1: 0.55594, throughput: 312.79 | 2022-04-03 08:28:37.289 [rank:5] [train], epoch: 13/50, iter: 800/834, loss: 0.35326, lr: 1.259056, top1: 0.55130, throughput: 312.89 | 2022-04-03 08:28:37.207 [rank:3] [train], epoch: 13/50, iter: 834/834, loss: 0.35197, lr: 1.257542, top1: 0.56005, throughput: 312.52 | 2022-04-03 08:28:58.139 [rank:7] [train], epoch: 13/50, iter: 834/834, loss: 0.34881, lr: 1.257542, top1: 0.56204, throughput: 312.24 | 2022-04-03 08:28:58.140 [rank:0] [train], epoch: 13/50, iter: 834/834, loss: 0.35029, lr: 1.257542, top1: 0.55683, throughput: 312.86 | 2022-04-03 08:28:58.141 [rank:1] [train], epoch: 13/50, iter: 834/834, loss: 0.35469, lr: 1.257542, top1: 0.54979, throughput: 312.28 | 2022-04-03 08:28:58.143 [rank:4] [train], epoch: 13/50, iter: 834/834, loss: 0.35484, lr: 1.257542, top1: 0.55208, throughput: 312.91 | 2022-04-03 08:28:58.147 [rank:5] [train], epoch: 13/50, iter: 834/834, loss: 0.35380, lr: 1.257542, top1: 0.54473, throughput: 311.62 | 2022-04-03 08:28:58.156 [rank:2] [train], epoch: 13/50, iter: 834/834, loss: 0.35186, lr: 1.257542, top1: 0.55806, throughput: 311.46 | 2022-04-03 08:28:58.179 [rank:6] [train], epoch: 13/50, iter: 834/834, loss: 0.34816, lr: 1.257542, top1: 0.55898, throughput: 312.22 | 2022-04-03 08:28:58.198 [rank:4] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.57280, throughput: 493.23 | 2022-04-03 08:29:10.819 [rank:5] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.56144, throughput: 493.55 | 2022-04-03 08:29:10.819 [rank:7] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.57136, throughput: 492.89 | 2022-04-03 08:29:10.821 [rank:6] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.56432, throughput: 495.08 | 2022-04-03 08:29:10.822 [rank:3] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.56064, throughput: 492.46 | 2022-04-03 08:29:10.830 [rank:0] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.57472, throughput: 492.54 | 2022-04-03 08:29:10.831 [rank:2] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.56816, throughput: 493.85 | 2022-04-03 08:29:10.834 [rank:1] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.56928, throughput: 491.23 | 2022-04-03 08:29:10.867 [rank:6] [train], epoch: 14/50, iter: 100/834, loss: 0.34817, lr: 1.253070, top1: 0.56302, throughput: 313.04 | 2022-04-03 08:30:12.156 [rank:1] [train], epoch: 14/50, iter: 100/834, loss: 0.34845, lr: 1.253070, top1: 0.56240, throughput: 313.25 | 2022-04-03 08:30:12.159 [rank:7] [train], epoch: 14/50, iter: 100/834, loss: 0.34768, lr: 1.253070, top1: 0.56510, throughput: 312.84 | 2022-04-03 08:30:12.193 [rank:3] [train], epoch: 14/50, iter: 100/834, loss: 0.34810, lr: 1.253070, top1: 0.56089, throughput: 312.82 | 2022-04-03 08:30:12.207 [rank:4] [train], epoch: 14/50, iter: 100/834, loss: 0.34630, lr: 1.253070, top1: 0.57094, throughput: 312.68 | 2022-04-03 08:30:12.223 [rank:0] [train], epoch: 14/50, iter: 100/834, loss: 0.34489, lr: 1.253070, top1: 0.56792, throughput: 312.70 | 2022-04-03 08:30:12.232 [rank:2] [train], epoch: 14/50, iter: 100/834, loss: 0.34835, lr: 1.253070, top1: 0.55651, throughput: 312.70 | 2022-04-03 08:30:12.236 [rank:5] [train], epoch: 14/50, iter: 100/834, loss: 0.34380, lr: 1.253070, top1: 0.56656, throughput: 312.44 | 2022-04-03 08:30:12.270 [rank:1] [train], epoch: 14/50, iter: 200/834, loss: 0.34872, lr: 1.248570, top1: 0.56354, throughput: 310.99 | 2022-04-03 08:31:13.898 [rank:5] [train], epoch: 14/50, iter: 200/834, loss: 0.34783, lr: 1.248570, top1: 0.56349, throughput: 311.45 | 2022-04-03 08:31:13.916 [rank:3] [train], epoch: 14/50, iter: 200/834, loss: 0.34775, lr: 1.248570, top1: 0.56161, throughput: 311.10 | 2022-04-03 08:31:13.922 [rank:6] [train], epoch: 14/50, iter: 200/834, loss: 0.34813, lr: 1.248570, top1: 0.56198, throughput: 310.82 | 2022-04-03 08:31:13.928 [rank:2] [train], epoch: 14/50, iter: 200/834, loss: 0.35038, lr: 1.248570, top1: 0.55786, throughput: 311.16 | 2022-04-03 08:31:13.941 [rank:4] [train], epoch: 14/50, iter: 200/834, loss: 0.34703, lr: 1.248570, top1: 0.56604, throughput: 311.07 | 2022-04-03 08:31:13.945 [rank:0] [train], epoch: 14/50, iter: 200/834, loss: 0.34868, lr: 1.248570, top1: 0.56099, throughput: 311.09 | 2022-04-03 08:31:13.950 [rank:7] [train], epoch: 14/50, iter: 200/834, loss: 0.35117, lr: 1.248570, top1: 0.55406, throughput: 310.89 | 2022-04-03 08:31:13.952 [rank:2] [train], epoch: 14/50, iter: 300/834, loss: 0.34851, lr: 1.244043, top1: 0.56208, throughput: 312.94 | 2022-04-03 08:32:15.294 [rank:7] [train], epoch: 14/50, iter: 300/834, loss: 0.34869, lr: 1.244043, top1: 0.55927, throughput: 312.99 | 2022-04-03 08:32:15.295 [rank:6] [train], epoch: 14/50, iter: 300/834, loss: 0.34887, lr: 1.244043, top1: 0.55969, throughput: 312.71 | 2022-04-03 08:32:15.327 [rank:3] [train], epoch: 14/50, iter: 300/834, loss: 0.35043, lr: 1.244043, top1: 0.55766, throughput: 312.65 | 2022-04-03 08:32:15.334 [rank:0] [train], epoch: 14/50, iter: 300/834, loss: 0.34941, lr: 1.244043, top1: 0.55693, throughput: 312.76 | 2022-04-03 08:32:15.339 [rank:1] [train], epoch: 14/50, iter: 300/834, loss: 0.34991, lr: 1.244043, top1: 0.56047, throughput: 312.41 | 2022-04-03 08:32:15.354 [rank:5] [train], epoch: 14/50, iter: 300/834, loss: 0.34833, lr: 1.244043, top1: 0.55859, throughput: 312.49 | 2022-04-03 08:32:15.359 [rank:4] [train], epoch: 14/50, iter: 300/834, loss: 0.35114, lr: 1.244043, top1: 0.55682, throughput: 312.50 | 2022-04-03 08:32:15.386 [rank:3] [train], epoch: 14/50, iter: 400/834, loss: 0.34607, lr: 1.239489, top1: 0.55917, throughput: 312.08 | 2022-04-03 08:33:16.857 [rank:2] [train], epoch: 14/50, iter: 400/834, loss: 0.34949, lr: 1.239489, top1: 0.55786, throughput: 311.84 | 2022-04-03 08:33:16.865 [rank:0] [train], epoch: 14/50, iter: 400/834, loss: 0.34975, lr: 1.239489, top1: 0.56245, throughput: 311.96 | 2022-04-03 08:33:16.885 [rank:7] [train], epoch: 14/50, iter: 400/834, loss: 0.35020, lr: 1.239489, top1: 0.55521, throughput: 311.73 | 2022-04-03 08:33:16.886 [rank:6] [train], epoch: 14/50, iter: 400/834, loss: 0.34805, lr: 1.239489, top1: 0.55818, throughput: 311.82 | 2022-04-03 08:33:16.900 [rank:1] [train], epoch: 14/50, iter: 400/834, loss: 0.34744, lr: 1.239489, top1: 0.56411, throughput: 311.94 | 2022-04-03 08:33:16.904 [rank:4] [train], epoch: 14/50, iter: 400/834, loss: 0.34412, lr: 1.239489, top1: 0.56958, throughput: 312.00 | 2022-04-03 08:33:16.924 [rank:5] [train], epoch: 14/50, iter: 400/834, loss: 0.34947, lr: 1.239489, top1: 0.55531, throughput: 311.81 | 2022-04-03 08:33:16.934 [rank:2] [train], epoch: 14/50, iter: 500/834, loss: 0.35179, lr: 1.234909, top1: 0.55339, throughput: 313.87 | 2022-04-03 08:34:18.037 [rank:1] [train], epoch: 14/50, iter: 500/834, loss: 0.34778, lr: 1.234909, top1: 0.56344, throughput: 313.96 | 2022-04-03 08:34:18.058 [rank:0] [train], epoch: 14/50, iter: 500/834, loss: 0.35088, lr: 1.234909, top1: 0.55417, throughput: 313.80 | 2022-04-03 08:34:18.071 [rank:5] [train], epoch: 14/50, iter: 500/834, loss: 0.35112, lr: 1.234909, top1: 0.55458, throughput: 314.04 | 2022-04-03 08:34:18.073 [rank:3] [train], epoch: 14/50, iter: 500/834, loss: 0.34902, lr: 1.234909, top1: 0.55677, throughput: 313.59 | 2022-04-03 08:34:18.084 [rank:4] [train], epoch: 14/50, iter: 500/834, loss: 0.34868, lr: 1.234909, top1: 0.56057, throughput: 313.93 | 2022-04-03 08:34:18.084 [rank:7] [train], epoch: 14/50, iter: 500/834, loss: 0.34887, lr: 1.234909, top1: 0.55786, throughput: 313.68 | 2022-04-03 08:34:18.095 [rank:6] [train], epoch: 14/50, iter: 500/834, loss: 0.35030, lr: 1.234909, top1: 0.55411, throughput: 314.12 | 2022-04-03 08:34:18.023 [rank:6] [train], epoch: 14/50, iter: 600/834, loss: 0.34974, lr: 1.230302, top1: 0.55625, throughput: 311.75 | 2022-04-03 08:35:19.611 [rank:1] [train], epoch: 14/50, iter: 600/834, loss: 0.34514, lr: 1.230302, top1: 0.56901, throughput: 311.92 | 2022-04-03 08:35:19.613 [rank:5] [train], epoch: 14/50, iter: 600/834, loss: 0.35203, lr: 1.230302, top1: 0.55255, throughput: 312.22 | 2022-04-03 08:35:19.567 [rank:0] [train], epoch: 14/50, iter: 600/834, loss: 0.34845, lr: 1.230302, top1: 0.55839, throughput: 311.80 | 2022-04-03 08:35:19.648 [rank:2] [train], epoch: 14/50, iter: 600/834, loss: 0.35181, lr: 1.230302, top1: 0.54802, throughput: 311.63 | 2022-04-03 08:35:19.650 [rank:3] [train], epoch: 14/50, iter: 600/834, loss: 0.34747, lr: 1.230302, top1: 0.55948, throughput: 311.85 | 2022-04-03 08:35:19.652 [rank:7] [train], epoch: 14/50, iter: 600/834, loss: 0.34876, lr: 1.230302, top1: 0.56141, throughput: 312.19 | 2022-04-03 08:35:19.595 [rank:4] [train], epoch: 14/50, iter: 600/834, loss: 0.34968, lr: 1.230302, top1: 0.55943, throughput: 311.62 | 2022-04-03 08:35:19.697 [rank:7] [train], epoch: 14/50, iter: 700/834, loss: 0.35094, lr: 1.225668, top1: 0.55510, throughput: 311.85 | 2022-04-03 08:36:21.163 [rank:6] [train], epoch: 14/50, iter: 700/834, loss: 0.35034, lr: 1.225668, top1: 0.55708, throughput: 311.80 | 2022-04-03 08:36:21.189 [rank:5] [train], epoch: 14/50, iter: 700/834, loss: 0.35116, lr: 1.225668, top1: 0.55193, throughput: 311.49 | 2022-04-03 08:36:21.207 [rank:4] [train], epoch: 14/50, iter: 700/834, loss: 0.34988, lr: 1.225668, top1: 0.55708, throughput: 312.06 | 2022-04-03 08:36:21.224 [rank:1] [train], epoch: 14/50, iter: 700/834, loss: 0.35114, lr: 1.225668, top1: 0.55693, throughput: 311.63 | 2022-04-03 08:36:21.225 [rank:2] [train], epoch: 14/50, iter: 700/834, loss: 0.35342, lr: 1.225668, top1: 0.55333, throughput: 311.74 | 2022-04-03 08:36:21.240 [rank:0] [train], epoch: 14/50, iter: 700/834, loss: 0.34924, lr: 1.225668, top1: 0.55760, throughput: 311.72 | 2022-04-03 08:36:21.243 [rank:3] [train], epoch: 14/50, iter: 700/834, loss: 0.34685, lr: 1.225668, top1: 0.56214, throughput: 311.71 | 2022-04-03 08:36:21.248 [rank:5] [train], epoch: 14/50, iter: 800/834, loss: 0.34810, lr: 1.221009, top1: 0.56203, throughput: 313.61 | 2022-04-03 08:37:22.430 [rank:7] [train], epoch: 14/50, iter: 800/834, loss: 0.35033, lr: 1.221009, top1: 0.55714, throughput: 313.20 | 2022-04-03 08:37:22.465 [rank:3] [train], epoch: 14/50, iter: 800/834, loss: 0.35042, lr: 1.221009, top1: 0.56318, throughput: 313.58 | 2022-04-03 08:37:22.476 [rank:2] [train], epoch: 14/50, iter: 800/834, loss: 0.35100, lr: 1.221009, top1: 0.55792, throughput: 313.47 | 2022-04-03 08:37:22.489 [rank:4] [train], epoch: 14/50, iter: 800/834, loss: 0.34810, lr: 1.221009, top1: 0.56234, throughput: 313.25 | 2022-04-03 08:37:22.516 [rank:1] [train], epoch: 14/50, iter: 800/834, loss: 0.34976, lr: 1.221009, top1: 0.55786, throughput: 313.65 | 2022-04-03 08:37:22.439 [rank:0] [train], epoch: 14/50, iter: 800/834, loss: 0.35298, lr: 1.221009, top1: 0.55198, throughput: 313.32 | 2022-04-03 08:37:22.522 [rank:6] [train], epoch: 14/50, iter: 800/834, loss: 0.34571, lr: 1.221009, top1: 0.56172, throughput: 313.03 | 2022-04-03 08:37:22.526 [rank:3] [train], epoch: 14/50, iter: 834/834, loss: 0.35142, lr: 1.219419, top1: 0.55760, throughput: 312.36 | 2022-04-03 08:37:43.375 [rank:5] [train], epoch: 14/50, iter: 834/834, loss: 0.34991, lr: 1.219419, top1: 0.55959, throughput: 311.61 | 2022-04-03 08:37:43.380 [rank:1] [train], epoch: 14/50, iter: 834/834, loss: 0.34674, lr: 1.219419, top1: 0.55699, throughput: 311.73 | 2022-04-03 08:37:43.380 [rank:2] [train], epoch: 14/50, iter: 834/834, loss: 0.34916, lr: 1.219419, top1: 0.55852, throughput: 312.45 | 2022-04-03 08:37:43.382 [rank:6] [train], epoch: 14/50, iter: 834/834, loss: 0.35359, lr: 1.219419, top1: 0.55009, throughput: 312.89 | 2022-04-03 08:37:43.389 [rank:4] [train], epoch: 14/50, iter: 834/834, loss: 0.34599, lr: 1.219419, top1: 0.57123, throughput: 312.65 | 2022-04-03 08:37:43.396 [rank:7] [train], epoch: 14/50, iter: 834/834, loss: 0.34857, lr: 1.219419, top1: 0.56066, throughput: 311.74 | 2022-04-03 08:37:43.406 [rank:0] [train], epoch: 14/50, iter: 834/834, loss: 0.35502, lr: 1.219419, top1: 0.54841, throughput: 311.66 | 2022-04-03 08:37:43.468 [rank:7] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56832, throughput: 489.30 | 2022-04-03 08:37:56.179 [rank:4] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56128, throughput: 488.89 | 2022-04-03 08:37:56.180 [rank:6] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56800, throughput: 488.46 | 2022-04-03 08:37:56.185 [rank:2] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.55728, throughput: 488.11 | 2022-04-03 08:37:56.187 [rank:0] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.57696, throughput: 491.21 | 2022-04-03 08:37:56.192 [rank:5] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.55920, throughput: 487.81 | 2022-04-03 08:37:56.192 [rank:3] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.55376, throughput: 487.49 | 2022-04-03 08:37:56.196 [rank:1] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56288, throughput: 486.38 | 2022-04-03 08:37:56.230 [rank:1] [train], epoch: 15/50, iter: 100/834, loss: 0.34459, lr: 1.214725, top1: 0.56552, throughput: 315.63 | 2022-04-03 08:38:57.062 [rank:6] [train], epoch: 15/50, iter: 100/834, loss: 0.34113, lr: 1.214725, top1: 0.57135, throughput: 315.36 | 2022-04-03 08:38:57.068 [rank:0] [train], epoch: 15/50, iter: 100/834, loss: 0.34336, lr: 1.214725, top1: 0.57010, throughput: 315.31 | 2022-04-03 08:38:57.085 [rank:5] [train], epoch: 15/50, iter: 100/834, loss: 0.34206, lr: 1.214725, top1: 0.57276, throughput: 315.18 | 2022-04-03 08:38:57.110 [rank:4] [train], epoch: 15/50, iter: 100/834, loss: 0.34806, lr: 1.214725, top1: 0.56313, throughput: 315.11 | 2022-04-03 08:38:57.111 [rank:7] [train], epoch: 15/50, iter: 100/834, loss: 0.34190, lr: 1.214725, top1: 0.56839, throughput: 315.05 | 2022-04-03 08:38:57.122 [rank:3] [train], epoch: 15/50, iter: 100/834, loss: 0.33940, lr: 1.214725, top1: 0.57615, throughput: 315.13 | 2022-04-03 08:38:57.123 [rank:2] [train], epoch: 15/50, iter: 100/834, loss: 0.34212, lr: 1.214725, top1: 0.57547, throughput: 315.03 | 2022-04-03 08:38:57.134 [rank:7] [train], epoch: 15/50, iter: 200/834, loss: 0.34624, lr: 1.210006, top1: 0.56729, throughput: 312.61 | 2022-04-03 08:39:58.540 [rank:0] [train], epoch: 15/50, iter: 200/834, loss: 0.34245, lr: 1.210006, top1: 0.57187, throughput: 312.38 | 2022-04-03 08:39:58.548 [rank:2] [train], epoch: 15/50, iter: 200/834, loss: 0.34309, lr: 1.210006, top1: 0.57109, throughput: 312.59 | 2022-04-03 08:39:58.556 [rank:6] [train], epoch: 15/50, iter: 200/834, loss: 0.34303, lr: 1.210006, top1: 0.56932, throughput: 312.25 | 2022-04-03 08:39:58.557 [rank:1] [train], epoch: 15/50, iter: 200/834, loss: 0.34392, lr: 1.210006, top1: 0.56854, throughput: 312.19 | 2022-04-03 08:39:58.562 [rank:3] [train], epoch: 15/50, iter: 200/834, loss: 0.34658, lr: 1.210006, top1: 0.55885, throughput: 312.46 | 2022-04-03 08:39:58.571 [rank:5] [train], epoch: 15/50, iter: 200/834, loss: 0.34774, lr: 1.210006, top1: 0.56474, throughput: 312.34 | 2022-04-03 08:39:58.581 [rank:4] [train], epoch: 15/50, iter: 200/834, loss: 0.34627, lr: 1.210006, top1: 0.57078, throughput: 312.31 | 2022-04-03 08:39:58.588 [rank:3] [train], epoch: 15/50, iter: 300/834, loss: 0.34613, lr: 1.205262, top1: 0.56260, throughput: 312.15 | 2022-04-03 08:41:00.080 [rank:0] [train], epoch: 15/50, iter: 300/834, loss: 0.34786, lr: 1.205262, top1: 0.56135, throughput: 312.01 | 2022-04-03 08:41:00.085 [rank:5] [train], epoch: 15/50, iter: 300/834, loss: 0.34585, lr: 1.205262, top1: 0.56917, throughput: 312.09 | 2022-04-03 08:41:00.101 [rank:1] [train], epoch: 15/50, iter: 300/834, loss: 0.34384, lr: 1.205262, top1: 0.56771, throughput: 311.97 | 2022-04-03 08:41:00.107 [rank:4] [train], epoch: 15/50, iter: 300/834, loss: 0.34716, lr: 1.205262, top1: 0.56443, throughput: 311.98 | 2022-04-03 08:41:00.129 [rank:2] [train], epoch: 15/50, iter: 300/834, loss: 0.34910, lr: 1.205262, top1: 0.55979, throughput: 311.80 | 2022-04-03 08:41:00.133 [rank:6] [train], epoch: 15/50, iter: 300/834, loss: 0.34769, lr: 1.205262, top1: 0.56328, throughput: 311.80 | 2022-04-03 08:41:00.135 [rank:7] [train], epoch: 15/50, iter: 300/834, loss: 0.34507, lr: 1.205262, top1: 0.56755, throughput: 311.69 | 2022-04-03 08:41:00.140 [rank:0] [train], epoch: 15/50, iter: 400/834, loss: 0.34710, lr: 1.200493, top1: 0.56135, throughput: 313.49 | 2022-04-03 08:42:01.331 [rank:1] [train], epoch: 15/50, iter: 400/834, loss: 0.34555, lr: 1.200493, top1: 0.56443, throughput: 313.55 | 2022-04-03 08:42:01.340 [rank:7] [train], epoch: 15/50, iter: 400/834, loss: 0.34294, lr: 1.200493, top1: 0.57047, throughput: 313.59 | 2022-04-03 08:42:01.366 [rank:5] [train], epoch: 15/50, iter: 400/834, loss: 0.34625, lr: 1.200493, top1: 0.56354, throughput: 313.36 | 2022-04-03 08:42:01.373 [rank:3] [train], epoch: 15/50, iter: 400/834, loss: 0.34709, lr: 1.200493, top1: 0.56198, throughput: 313.20 | 2022-04-03 08:42:01.383 [rank:4] [train], epoch: 15/50, iter: 400/834, loss: 0.34880, lr: 1.200493, top1: 0.55823, throughput: 313.45 | 2022-04-03 08:42:01.383 [rank:2] [train], epoch: 15/50, iter: 400/834, loss: 0.34606, lr: 1.200493, top1: 0.56542, throughput: 313.37 | 2022-04-03 08:42:01.402 [rank:6] [train], epoch: 15/50, iter: 400/834, loss: 0.34509, lr: 1.200493, top1: 0.56807, throughput: 313.77 | 2022-04-03 08:42:01.325 [rank:0] [train], epoch: 15/50, iter: 500/834, loss: 0.34403, lr: 1.195700, top1: 0.56693, throughput: 312.06 | 2022-04-03 08:43:02.857 [rank:6] [train], epoch: 15/50, iter: 500/834, loss: 0.34586, lr: 1.195700, top1: 0.56708, throughput: 312.02 | 2022-04-03 08:43:02.860 [rank:7] [train], epoch: 15/50, iter: 500/834, loss: 0.34807, lr: 1.195700, top1: 0.56141, throughput: 312.07 | 2022-04-03 08:43:02.890 [rank:4] [train], epoch: 15/50, iter: 500/834, loss: 0.34655, lr: 1.195700, top1: 0.56568, throughput: 312.12 | 2022-04-03 08:43:02.898 [rank:3] [train], epoch: 15/50, iter: 500/834, loss: 0.34621, lr: 1.195700, top1: 0.56130, throughput: 312.10 | 2022-04-03 08:43:02.902 [rank:2] [train], epoch: 15/50, iter: 500/834, loss: 0.34510, lr: 1.195700, top1: 0.56422, throughput: 312.14 | 2022-04-03 08:43:02.912 [rank:1] [train], epoch: 15/50, iter: 500/834, loss: 0.34715, lr: 1.195700, top1: 0.56151, throughput: 311.83 | 2022-04-03 08:43:02.913 [rank:5] [train], epoch: 15/50, iter: 500/834, loss: 0.34766, lr: 1.195700, top1: 0.55729, throughput: 311.88 | 2022-04-03 08:43:02.934 [rank:1] [train], epoch: 15/50, iter: 600/834, loss: 0.34433, lr: 1.190882, top1: 0.57099, throughput: 313.58 | 2022-04-03 08:44:04.142 [rank:3] [train], epoch: 15/50, iter: 600/834, loss: 0.34619, lr: 1.190882, top1: 0.56740, throughput: 313.49 | 2022-04-03 08:44:04.149 [rank:0] [train], epoch: 15/50, iter: 600/834, loss: 0.34546, lr: 1.190882, top1: 0.56719, throughput: 313.22 | 2022-04-03 08:44:04.155 [rank:5] [train], epoch: 15/50, iter: 600/834, loss: 0.34658, lr: 1.190882, top1: 0.56859, throughput: 313.48 | 2022-04-03 08:44:04.183 [rank:4] [train], epoch: 15/50, iter: 600/834, loss: 0.34699, lr: 1.190882, top1: 0.56391, throughput: 313.25 | 2022-04-03 08:44:04.192 [rank:7] [train], epoch: 15/50, iter: 600/834, loss: 0.34668, lr: 1.190882, top1: 0.56292, throughput: 313.15 | 2022-04-03 08:44:04.202 [rank:6] [train], epoch: 15/50, iter: 600/834, loss: 0.34743, lr: 1.190882, top1: 0.55948, throughput: 312.99 | 2022-04-03 08:44:04.203 [rank:2] [train], epoch: 15/50, iter: 600/834, loss: 0.34500, lr: 1.190882, top1: 0.56990, throughput: 313.14 | 2022-04-03 08:44:04.226 [rank:1] [train], epoch: 15/50, iter: 700/834, loss: 0.34674, lr: 1.186040, top1: 0.55859, throughput: 312.95 | 2022-04-03 08:45:05.493 [rank:5] [train], epoch: 15/50, iter: 700/834, loss: 0.34723, lr: 1.186040, top1: 0.56000, throughput: 313.16 | 2022-04-03 08:45:05.494 [rank:0] [train], epoch: 15/50, iter: 700/834, loss: 0.34771, lr: 1.186040, top1: 0.55958, throughput: 312.99 | 2022-04-03 08:45:05.499 [rank:2] [train], epoch: 15/50, iter: 700/834, loss: 0.34611, lr: 1.186040, top1: 0.56193, throughput: 313.23 | 2022-04-03 08:45:05.522 [rank:6] [train], epoch: 15/50, iter: 700/834, loss: 0.34957, lr: 1.186040, top1: 0.56354, throughput: 313.05 | 2022-04-03 08:45:05.536 [rank:7] [train], epoch: 15/50, iter: 700/834, loss: 0.34672, lr: 1.186040, top1: 0.56297, throughput: 313.03 | 2022-04-03 08:45:05.538 [rank:4] [train], epoch: 15/50, iter: 700/834, loss: 0.34624, lr: 1.186040, top1: 0.57047, throughput: 312.94 | 2022-04-03 08:45:05.546 [rank:3] [train], epoch: 15/50, iter: 700/834, loss: 0.34739, lr: 1.186040, top1: 0.56453, throughput: 312.70 | 2022-04-03 08:45:05.549 [rank:2] [train], epoch: 15/50, iter: 800/834, loss: 0.34623, lr: 1.181175, top1: 0.56464, throughput: 312.61 | 2022-04-03 08:46:06.941 [rank:5] [train], epoch: 15/50, iter: 800/834, loss: 0.34450, lr: 1.181175, top1: 0.56828, throughput: 312.46 | 2022-04-03 08:46:06.942 [rank:3] [train], epoch: 15/50, iter: 800/834, loss: 0.34820, lr: 1.181175, top1: 0.56297, throughput: 312.73 | 2022-04-03 08:46:06.943 [rank:1] [train], epoch: 15/50, iter: 800/834, loss: 0.34454, lr: 1.181175, top1: 0.56573, throughput: 312.45 | 2022-04-03 08:46:06.944 [rank:4] [train], epoch: 15/50, iter: 800/834, loss: 0.34819, lr: 1.181175, top1: 0.56188, throughput: 312.57 | 2022-04-03 08:46:06.972 [rank:6] [train], epoch: 15/50, iter: 800/834, loss: 0.34624, lr: 1.181175, top1: 0.56438, throughput: 312.48 | 2022-04-03 08:46:06.979 [rank:0] [train], epoch: 15/50, iter: 800/834, loss: 0.34809, lr: 1.181175, top1: 0.56214, throughput: 312.22 | 2022-04-03 08:46:06.994 [rank:7] [train], epoch: 15/50, iter: 800/834, loss: 0.34819, lr: 1.181175, top1: 0.56385, throughput: 312.41 | 2022-04-03 08:46:06.995 [rank:1] [train], epoch: 15/50, iter: 834/834, loss: 0.34797, lr: 1.179515, top1: 0.56449, throughput: 310.97 | 2022-04-03 08:46:27.936 [rank:5] [train], epoch: 15/50, iter: 834/834, loss: 0.34245, lr: 1.179515, top1: 0.56924, throughput: 310.92 | 2022-04-03 08:46:27.937 [rank:7] [train], epoch: 15/50, iter: 834/834, loss: 0.34852, lr: 1.179515, top1: 0.55055, throughput: 311.64 | 2022-04-03 08:46:27.943 [rank:4] [train], epoch: 15/50, iter: 834/834, loss: 0.34467, lr: 1.179515, top1: 0.57001, throughput: 311.25 | 2022-04-03 08:46:27.945 [rank:2] [train], epoch: 15/50, iter: 834/834, loss: 0.34781, lr: 1.179515, top1: 0.56158, throughput: 310.76 | 2022-04-03 08:46:27.948 [rank:3] [train], epoch: 15/50, iter: 834/834, loss: 0.34733, lr: 1.179515, top1: 0.56311, throughput: 310.74 | 2022-04-03 08:46:27.950 [rank:6] [train], epoch: 15/50, iter: 834/834, loss: 0.34452, lr: 1.179515, top1: 0.56526, throughput: 311.25 | 2022-04-03 08:46:27.952 [rank:0] [train], epoch: 15/50, iter: 834/834, loss: 0.34786, lr: 1.179515, top1: 0.55653, throughput: 310.75 | 2022-04-03 08:46:28.001 [rank:6] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.55872, throughput: 493.86 | 2022-04-03 08:46:40.608 [rank:4] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.55856, throughput: 493.53 | 2022-04-03 08:46:40.609 [rank:2] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56640, throughput: 493.56 | 2022-04-03 08:46:40.611 [rank:7] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56768, throughput: 493.20 | 2022-04-03 08:46:40.615 [rank:0] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56656, throughput: 495.32 | 2022-04-03 08:46:40.620 [rank:5] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.55008, throughput: 492.78 | 2022-04-03 08:46:40.621 [rank:3] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.55936, throughput: 492.51 | 2022-04-03 08:46:40.640 [rank:1] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56512, throughput: 491.40 | 2022-04-03 08:46:40.655 [rank:5] [train], epoch: 16/50, iter: 100/834, loss: 0.33990, lr: 1.174618, top1: 0.57667, throughput: 309.78 | 2022-04-03 08:47:42.601 [rank:0] [train], epoch: 16/50, iter: 100/834, loss: 0.33870, lr: 1.174618, top1: 0.57818, throughput: 309.77 | 2022-04-03 08:47:42.601 [rank:2] [train], epoch: 16/50, iter: 100/834, loss: 0.33732, lr: 1.174618, top1: 0.58547, throughput: 309.60 | 2022-04-03 08:47:42.626 [rank:4] [train], epoch: 16/50, iter: 100/834, loss: 0.33962, lr: 1.174618, top1: 0.57828, throughput: 309.46 | 2022-04-03 08:47:42.653 [rank:6] [train], epoch: 16/50, iter: 100/834, loss: 0.33857, lr: 1.174618, top1: 0.57865, throughput: 309.36 | 2022-04-03 08:47:42.673 [rank:7] [train], epoch: 16/50, iter: 100/834, loss: 0.34064, lr: 1.174618, top1: 0.57255, throughput: 309.82 | 2022-04-03 08:47:42.586 [rank:1] [train], epoch: 16/50, iter: 100/834, loss: 0.34227, lr: 1.174618, top1: 0.57000, throughput: 309.57 | 2022-04-03 08:47:42.676 [rank:3] [train], epoch: 16/50, iter: 100/834, loss: 0.34190, lr: 1.174618, top1: 0.57255, throughput: 309.88 | 2022-04-03 08:47:42.600 [rank:0] [train], epoch: 16/50, iter: 200/834, loss: 0.34395, lr: 1.169698, top1: 0.56625, throughput: 311.68 | 2022-04-03 08:48:44.202 [rank:5] [train], epoch: 16/50, iter: 200/834, loss: 0.34121, lr: 1.169698, top1: 0.57422, throughput: 311.65 | 2022-04-03 08:48:44.208 [rank:1] [train], epoch: 16/50, iter: 200/834, loss: 0.34106, lr: 1.169698, top1: 0.57156, throughput: 311.98 | 2022-04-03 08:48:44.219 [rank:3] [train], epoch: 16/50, iter: 200/834, loss: 0.34256, lr: 1.169698, top1: 0.57172, throughput: 311.57 | 2022-04-03 08:48:44.224 [rank:7] [train], epoch: 16/50, iter: 200/834, loss: 0.34154, lr: 1.169698, top1: 0.57464, throughput: 311.50 | 2022-04-03 08:48:44.224 [rank:6] [train], epoch: 16/50, iter: 200/834, loss: 0.34082, lr: 1.169698, top1: 0.57344, throughput: 311.86 | 2022-04-03 08:48:44.238 [rank:2] [train], epoch: 16/50, iter: 200/834, loss: 0.34033, lr: 1.169698, top1: 0.57589, throughput: 311.62 | 2022-04-03 08:48:44.239 [rank:4] [train], epoch: 16/50, iter: 200/834, loss: 0.34258, lr: 1.169698, top1: 0.56979, throughput: 311.63 | 2022-04-03 08:48:44.265 [rank:0] [train], epoch: 16/50, iter: 300/834, loss: 0.34436, lr: 1.164755, top1: 0.56937, throughput: 314.31 | 2022-04-03 08:49:45.288 [rank:1] [train], epoch: 16/50, iter: 300/834, loss: 0.34283, lr: 1.164755, top1: 0.57120, throughput: 314.05 | 2022-04-03 08:49:45.356 [rank:2] [train], epoch: 16/50, iter: 300/834, loss: 0.34197, lr: 1.164755, top1: 0.57099, throughput: 314.14 | 2022-04-03 08:49:45.358 [rank:4] [train], epoch: 16/50, iter: 300/834, loss: 0.34300, lr: 1.164755, top1: 0.56839, throughput: 314.22 | 2022-04-03 08:49:45.370 [rank:6] [train], epoch: 16/50, iter: 300/834, loss: 0.34120, lr: 1.164755, top1: 0.57589, throughput: 314.06 | 2022-04-03 08:49:45.372 [rank:5] [train], epoch: 16/50, iter: 300/834, loss: 0.33935, lr: 1.164755, top1: 0.58073, throughput: 313.86 | 2022-04-03 08:49:45.381 [rank:7] [train], epoch: 16/50, iter: 300/834, loss: 0.34327, lr: 1.164755, top1: 0.57266, throughput: 313.94 | 2022-04-03 08:49:45.383 [rank:3] [train], epoch: 16/50, iter: 300/834, loss: 0.34166, lr: 1.164755, top1: 0.57047, throughput: 313.82 | 2022-04-03 08:49:45.406 [rank:1] [train], epoch: 16/50, iter: 400/834, loss: 0.34388, lr: 1.159790, top1: 0.56755, throughput: 311.13 | 2022-04-03 08:50:47.067 [rank:2] [train], epoch: 16/50, iter: 400/834, loss: 0.34520, lr: 1.159790, top1: 0.56615, throughput: 311.09 | 2022-04-03 08:50:47.077 [rank:0] [train], epoch: 16/50, iter: 400/834, loss: 0.34356, lr: 1.159790, top1: 0.56661, throughput: 310.73 | 2022-04-03 08:50:47.078 [rank:7] [train], epoch: 16/50, iter: 400/834, loss: 0.33805, lr: 1.159790, top1: 0.57906, throughput: 311.15 | 2022-04-03 08:50:47.089 [rank:6] [train], epoch: 16/50, iter: 400/834, loss: 0.34022, lr: 1.159790, top1: 0.57307, throughput: 311.03 | 2022-04-03 08:50:47.102 [rank:5] [train], epoch: 16/50, iter: 400/834, loss: 0.34410, lr: 1.159790, top1: 0.56562, throughput: 311.00 | 2022-04-03 08:50:47.117 [rank:4] [train], epoch: 16/50, iter: 400/834, loss: 0.34356, lr: 1.159790, top1: 0.56875, throughput: 310.93 | 2022-04-03 08:50:47.120 [rank:3] [train], epoch: 16/50, iter: 400/834, loss: 0.34271, lr: 1.159790, top1: 0.57245, throughput: 311.08 | 2022-04-03 08:50:47.126 [rank:6] [train], epoch: 16/50, iter: 500/834, loss: 0.34594, lr: 1.154803, top1: 0.56458, throughput: 312.88 | 2022-04-03 08:51:48.468 [rank:3] [train], epoch: 16/50, iter: 500/834, loss: 0.34534, lr: 1.154803, top1: 0.56448, throughput: 312.82 | 2022-04-03 08:51:48.503 [rank:4] [train], epoch: 16/50, iter: 500/834, loss: 0.34068, lr: 1.154803, top1: 0.57437, throughput: 312.73 | 2022-04-03 08:51:48.515 [rank:2] [train], epoch: 16/50, iter: 500/834, loss: 0.34208, lr: 1.154803, top1: 0.57521, throughput: 312.49 | 2022-04-03 08:51:48.518 [rank:1] [train], epoch: 16/50, iter: 500/834, loss: 0.34178, lr: 1.154803, top1: 0.57010, throughput: 312.31 | 2022-04-03 08:51:48.545 [rank:0] [train], epoch: 16/50, iter: 500/834, loss: 0.34600, lr: 1.154803, top1: 0.56354, throughput: 312.35 | 2022-04-03 08:51:48.547 [rank:7] [train], epoch: 16/50, iter: 500/834, loss: 0.34036, lr: 1.154803, top1: 0.57807, throughput: 312.40 | 2022-04-03 08:51:48.549 [rank:5] [train], epoch: 16/50, iter: 500/834, loss: 0.34394, lr: 1.154803, top1: 0.57016, throughput: 312.53 | 2022-04-03 08:51:48.551 [rank:6] [train], epoch: 16/50, iter: 600/834, loss: 0.34206, lr: 1.149793, top1: 0.57312, throughput: 312.16 | 2022-04-03 08:52:49.974 [rank:0] [train], epoch: 16/50, iter: 600/834, loss: 0.34440, lr: 1.149793, top1: 0.56589, throughput: 312.53 | 2022-04-03 08:52:49.982 [rank:2] [train], epoch: 16/50, iter: 600/834, loss: 0.34280, lr: 1.149793, top1: 0.57083, throughput: 312.37 | 2022-04-03 08:52:49.983 [rank:4] [train], epoch: 16/50, iter: 600/834, loss: 0.34398, lr: 1.149793, top1: 0.57271, throughput: 312.33 | 2022-04-03 08:52:49.989 [rank:3] [train], epoch: 16/50, iter: 600/834, loss: 0.34427, lr: 1.149793, top1: 0.56922, throughput: 312.26 | 2022-04-03 08:52:49.991 [rank:1] [train], epoch: 16/50, iter: 600/834, loss: 0.34303, lr: 1.149793, top1: 0.56958, throughput: 312.43 | 2022-04-03 08:52:49.999 [rank:7] [train], epoch: 16/50, iter: 600/834, loss: 0.34289, lr: 1.149793, top1: 0.57068, throughput: 312.41 | 2022-04-03 08:52:50.007 [rank:5] [train], epoch: 16/50, iter: 600/834, loss: 0.34610, lr: 1.149793, top1: 0.56932, throughput: 312.76 | 2022-04-03 08:52:49.940 [rank:6] [train], epoch: 16/50, iter: 700/834, loss: 0.34209, lr: 1.144762, top1: 0.57182, throughput: 312.70 | 2022-04-03 08:53:51.374 [rank:2] [train], epoch: 16/50, iter: 700/834, loss: 0.34529, lr: 1.144762, top1: 0.56682, throughput: 312.69 | 2022-04-03 08:53:51.387 [rank:3] [train], epoch: 16/50, iter: 700/834, loss: 0.34320, lr: 1.144762, top1: 0.56833, throughput: 312.54 | 2022-04-03 08:53:51.422 [rank:0] [train], epoch: 16/50, iter: 700/834, loss: 0.34464, lr: 1.144762, top1: 0.56521, throughput: 312.39 | 2022-04-03 08:53:51.443 [rank:1] [train], epoch: 16/50, iter: 700/834, loss: 0.34185, lr: 1.144762, top1: 0.57391, throughput: 312.47 | 2022-04-03 08:53:51.445 [rank:4] [train], epoch: 16/50, iter: 700/834, loss: 0.34326, lr: 1.144762, top1: 0.57010, throughput: 312.35 | 2022-04-03 08:53:51.459 [rank:7] [train], epoch: 16/50, iter: 700/834, loss: 0.34396, lr: 1.144762, top1: 0.56656, throughput: 312.43 | 2022-04-03 08:53:51.461 [rank:5] [train], epoch: 16/50, iter: 700/834, loss: 0.34707, lr: 1.144762, top1: 0.56302, throughput: 312.50 | 2022-04-03 08:53:51.380 [rank:3] [train], epoch: 16/50, iter: 800/834, loss: 0.34215, lr: 1.139709, top1: 0.57146, throughput: 314.38 | 2022-04-03 08:54:52.496 [rank:1] [train], epoch: 16/50, iter: 800/834, loss: 0.34290, lr: 1.139709, top1: 0.57000, throughput: 314.18 | 2022-04-03 08:54:52.556 [rank:2] [train], epoch: 16/50, iter: 800/834, loss: 0.34059, lr: 1.139709, top1: 0.57229, throughput: 313.87 | 2022-04-03 08:54:52.559 [rank:7] [train], epoch: 16/50, iter: 800/834, loss: 0.34453, lr: 1.139709, top1: 0.56995, throughput: 314.14 | 2022-04-03 08:54:52.580 [rank:6] [train], epoch: 16/50, iter: 800/834, loss: 0.34388, lr: 1.139709, top1: 0.57354, throughput: 313.66 | 2022-04-03 08:54:52.587 [rank:0] [train], epoch: 16/50, iter: 800/834, loss: 0.34164, lr: 1.139709, top1: 0.57151, throughput: 314.01 | 2022-04-03 08:54:52.588 [rank:5] [train], epoch: 16/50, iter: 800/834, loss: 0.34325, lr: 1.139709, top1: 0.56625, throughput: 313.69 | 2022-04-03 08:54:52.588 [rank:4] [train], epoch: 16/50, iter: 800/834, loss: 0.34411, lr: 1.139709, top1: 0.56677, throughput: 314.09 | 2022-04-03 08:54:52.589 [rank:5] [train], epoch: 16/50, iter: 834/834, loss: 0.34848, lr: 1.137987, top1: 0.56464, throughput: 311.54 | 2022-04-03 08:55:13.542 [rank:1] [train], epoch: 16/50, iter: 834/834, loss: 0.34569, lr: 1.137987, top1: 0.56587, throughput: 310.94 | 2022-04-03 08:55:13.550 [rank:6] [train], epoch: 16/50, iter: 834/834, loss: 0.34466, lr: 1.137987, top1: 0.56786, throughput: 311.23 | 2022-04-03 08:55:13.562 [rank:2] [train], epoch: 16/50, iter: 834/834, loss: 0.34732, lr: 1.137987, top1: 0.56097, throughput: 310.73 | 2022-04-03 08:55:13.567 [rank:7] [train], epoch: 16/50, iter: 834/834, loss: 0.34445, lr: 1.137987, top1: 0.56281, throughput: 310.94 | 2022-04-03 08:55:13.575 [rank:4] [train], epoch: 16/50, iter: 834/834, loss: 0.33828, lr: 1.137987, top1: 0.58119, throughput: 310.46 | 2022-04-03 08:55:13.616 [rank:0] [train], epoch: 16/50, iter: 834/834, loss: 0.34454, lr: 1.137987, top1: 0.56373, throughput: 310.33 | 2022-04-03 08:55:13.624 [rank:3] [train], epoch: 16/50, iter: 834/834, loss: 0.34105, lr: 1.137987, top1: 0.57230, throughput: 308.86 | 2022-04-03 08:55:13.631 [rank:0] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.55712, throughput: 489.65 | 2022-04-03 08:55:26.388 [rank:2] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.54752, throughput: 487.30 | 2022-04-03 08:55:26.393 [rank:7] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.55296, throughput: 487.19 | 2022-04-03 08:55:26.403 [rank:5] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.54352, throughput: 485.22 | 2022-04-03 08:55:26.423 [rank:3] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.54480, throughput: 488.51 | 2022-04-03 08:55:26.425 [rank:6] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.53936, throughput: 485.91 | 2022-04-03 08:55:26.425 [rank:4] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.54384, throughput: 487.77 | 2022-04-03 08:55:26.429 [rank:1] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.55408, throughput: 484.56 | 2022-04-03 08:55:26.448 [rank:7] [train], epoch: 17/50, iter: 100/834, loss: 0.33897, lr: 1.132906, top1: 0.57120, throughput: 313.79 | 2022-04-03 08:56:27.591 [rank:6] [train], epoch: 17/50, iter: 100/834, loss: 0.33850, lr: 1.132906, top1: 0.57719, throughput: 313.90 | 2022-04-03 08:56:27.591 [rank:0] [train], epoch: 17/50, iter: 100/834, loss: 0.33292, lr: 1.132906, top1: 0.59089, throughput: 313.70 | 2022-04-03 08:56:27.592 [rank:2] [train], epoch: 17/50, iter: 100/834, loss: 0.33561, lr: 1.132906, top1: 0.58214, throughput: 313.71 | 2022-04-03 08:56:27.596 [rank:4] [train], epoch: 17/50, iter: 100/834, loss: 0.33784, lr: 1.132906, top1: 0.57990, throughput: 313.89 | 2022-04-03 08:56:27.597 [rank:3] [train], epoch: 17/50, iter: 100/834, loss: 0.33780, lr: 1.132906, top1: 0.58245, throughput: 313.85 | 2022-04-03 08:56:27.601 [rank:5] [train], epoch: 17/50, iter: 100/834, loss: 0.33717, lr: 1.132906, top1: 0.58161, throughput: 313.77 | 2022-04-03 08:56:27.614 [rank:1] [train], epoch: 17/50, iter: 100/834, loss: 0.34052, lr: 1.132906, top1: 0.57260, throughput: 313.81 | 2022-04-03 08:56:27.631 [rank:1] [train], epoch: 17/50, iter: 200/834, loss: 0.33763, lr: 1.127805, top1: 0.58297, throughput: 313.56 | 2022-04-03 08:57:28.864 [rank:2] [train], epoch: 17/50, iter: 200/834, loss: 0.33696, lr: 1.127805, top1: 0.57786, throughput: 313.33 | 2022-04-03 08:57:28.874 [rank:6] [train], epoch: 17/50, iter: 200/834, loss: 0.33700, lr: 1.127805, top1: 0.57854, throughput: 313.27 | 2022-04-03 08:57:28.879 [rank:7] [train], epoch: 17/50, iter: 200/834, loss: 0.33543, lr: 1.127805, top1: 0.58609, throughput: 313.08 | 2022-04-03 08:57:28.917 [rank:4] [train], epoch: 17/50, iter: 200/834, loss: 0.33989, lr: 1.127805, top1: 0.57911, throughput: 313.07 | 2022-04-03 08:57:28.925 [rank:3] [train], epoch: 17/50, iter: 200/834, loss: 0.33742, lr: 1.127805, top1: 0.58005, throughput: 313.04 | 2022-04-03 08:57:28.934 [rank:0] [train], epoch: 17/50, iter: 200/834, loss: 0.33706, lr: 1.127805, top1: 0.58276, throughput: 312.91 | 2022-04-03 08:57:28.951 [rank:5] [train], epoch: 17/50, iter: 200/834, loss: 0.33883, lr: 1.127805, top1: 0.57719, throughput: 313.00 | 2022-04-03 08:57:28.956 [rank:4] [train], epoch: 17/50, iter: 300/834, loss: 0.33362, lr: 1.122683, top1: 0.58927, throughput: 313.72 | 2022-04-03 08:58:30.127 [rank:3] [train], epoch: 17/50, iter: 300/834, loss: 0.33713, lr: 1.122683, top1: 0.58000, throughput: 313.66 | 2022-04-03 08:58:30.147 [rank:6] [train], epoch: 17/50, iter: 300/834, loss: 0.33814, lr: 1.122683, top1: 0.57865, throughput: 313.34 | 2022-04-03 08:58:30.155 [rank:1] [train], epoch: 17/50, iter: 300/834, loss: 0.34007, lr: 1.122683, top1: 0.57635, throughput: 313.25 | 2022-04-03 08:58:30.156 [rank:2] [train], epoch: 17/50, iter: 300/834, loss: 0.34099, lr: 1.122683, top1: 0.57339, throughput: 313.24 | 2022-04-03 08:58:30.170 [rank:0] [train], epoch: 17/50, iter: 300/834, loss: 0.33940, lr: 1.122683, top1: 0.58073, throughput: 313.59 | 2022-04-03 08:58:30.178 [rank:5] [train], epoch: 17/50, iter: 300/834, loss: 0.33908, lr: 1.122683, top1: 0.58000, throughput: 313.58 | 2022-04-03 08:58:30.183 [rank:7] [train], epoch: 17/50, iter: 300/834, loss: 0.33895, lr: 1.122683, top1: 0.57615, throughput: 313.35 | 2022-04-03 08:58:30.189 [rank:5] [train], epoch: 17/50, iter: 400/834, loss: 0.34059, lr: 1.117541, top1: 0.57760, throughput: 312.44 | 2022-04-03 08:59:31.635 [rank:3] [train], epoch: 17/50, iter: 400/834, loss: 0.33897, lr: 1.117541, top1: 0.57979, throughput: 312.22 | 2022-04-03 08:59:31.643 [rank:6] [train], epoch: 17/50, iter: 400/834, loss: 0.33857, lr: 1.117541, top1: 0.57896, throughput: 312.22 | 2022-04-03 08:59:31.650 [rank:2] [train], epoch: 17/50, iter: 400/834, loss: 0.34177, lr: 1.117541, top1: 0.57214, throughput: 312.29 | 2022-04-03 08:59:31.650 [rank:4] [train], epoch: 17/50, iter: 400/834, loss: 0.34198, lr: 1.117541, top1: 0.57656, throughput: 312.06 | 2022-04-03 08:59:31.653 [rank:1] [train], epoch: 17/50, iter: 400/834, loss: 0.34071, lr: 1.117541, top1: 0.57505, throughput: 312.11 | 2022-04-03 08:59:31.672 [rank:0] [train], epoch: 17/50, iter: 400/834, loss: 0.34189, lr: 1.117541, top1: 0.57344, throughput: 312.21 | 2022-04-03 08:59:31.675 [rank:7] [train], epoch: 17/50, iter: 400/834, loss: 0.34274, lr: 1.117541, top1: 0.56792, throughput: 312.25 | 2022-04-03 08:59:31.678 [rank:3] [train], epoch: 17/50, iter: 500/834, loss: 0.33742, lr: 1.112379, top1: 0.58026, throughput: 312.97 | 2022-04-03 09:00:32.991 [rank:0] [train], epoch: 17/50, iter: 500/834, loss: 0.34104, lr: 1.112379, top1: 0.57568, throughput: 312.94 | 2022-04-03 09:00:33.028 [rank:4] [train], epoch: 17/50, iter: 500/834, loss: 0.33734, lr: 1.112379, top1: 0.57474, throughput: 312.80 | 2022-04-03 09:00:33.034 [rank:2] [train], epoch: 17/50, iter: 500/834, loss: 0.33816, lr: 1.112379, top1: 0.57875, throughput: 312.78 | 2022-04-03 09:00:33.035 [rank:7] [train], epoch: 17/50, iter: 500/834, loss: 0.34027, lr: 1.112379, top1: 0.57703, throughput: 312.86 | 2022-04-03 09:00:33.047 [rank:5] [train], epoch: 17/50, iter: 500/834, loss: 0.34359, lr: 1.112379, top1: 0.57365, throughput: 312.64 | 2022-04-03 09:00:33.047 [rank:1] [train], epoch: 17/50, iter: 500/834, loss: 0.33858, lr: 1.112379, top1: 0.58016, throughput: 312.82 | 2022-04-03 09:00:33.049 [rank:6] [train], epoch: 17/50, iter: 500/834, loss: 0.33949, lr: 1.112379, top1: 0.58094, throughput: 313.03 | 2022-04-03 09:00:32.986 [rank:6] [train], epoch: 17/50, iter: 600/834, loss: 0.34148, lr: 1.107198, top1: 0.57177, throughput: 312.71 | 2022-04-03 09:01:34.385 [rank:1] [train], epoch: 17/50, iter: 600/834, loss: 0.33942, lr: 1.107198, top1: 0.57776, throughput: 312.92 | 2022-04-03 09:01:34.408 [rank:3] [train], epoch: 17/50, iter: 600/834, loss: 0.33951, lr: 1.107198, top1: 0.57318, throughput: 312.62 | 2022-04-03 09:01:34.408 [rank:2] [train], epoch: 17/50, iter: 600/834, loss: 0.33843, lr: 1.107198, top1: 0.58115, throughput: 312.77 | 2022-04-03 09:01:34.422 [rank:5] [train], epoch: 17/50, iter: 600/834, loss: 0.34133, lr: 1.107198, top1: 0.57432, throughput: 312.77 | 2022-04-03 09:01:34.435 [rank:7] [train], epoch: 17/50, iter: 600/834, loss: 0.33922, lr: 1.107198, top1: 0.58078, throughput: 312.73 | 2022-04-03 09:01:34.441 [rank:4] [train], epoch: 17/50, iter: 600/834, loss: 0.33906, lr: 1.107198, top1: 0.57589, throughput: 312.64 | 2022-04-03 09:01:34.447 [rank:0] [train], epoch: 17/50, iter: 600/834, loss: 0.34010, lr: 1.107198, top1: 0.57625, throughput: 312.51 | 2022-04-03 09:01:34.467 [rank:6] [train], epoch: 17/50, iter: 700/834, loss: 0.33999, lr: 1.101997, top1: 0.57661, throughput: 310.65 | 2022-04-03 09:02:36.190 [rank:5] [train], epoch: 17/50, iter: 700/834, loss: 0.34252, lr: 1.101997, top1: 0.56964, throughput: 310.86 | 2022-04-03 09:02:36.199 [rank:7] [train], epoch: 17/50, iter: 700/834, loss: 0.33720, lr: 1.101997, top1: 0.57734, throughput: 310.84 | 2022-04-03 09:02:36.208 [rank:1] [train], epoch: 17/50, iter: 700/834, loss: 0.34163, lr: 1.101997, top1: 0.57651, throughput: 310.49 | 2022-04-03 09:02:36.245 [rank:4] [train], epoch: 17/50, iter: 700/834, loss: 0.33938, lr: 1.101997, top1: 0.57568, throughput: 310.69 | 2022-04-03 09:02:36.246 [rank:3] [train], epoch: 17/50, iter: 700/834, loss: 0.34009, lr: 1.101997, top1: 0.57667, throughput: 310.39 | 2022-04-03 09:02:36.266 [rank:2] [train], epoch: 17/50, iter: 700/834, loss: 0.34287, lr: 1.101997, top1: 0.56781, throughput: 310.94 | 2022-04-03 09:02:36.170 [rank:0] [train], epoch: 17/50, iter: 700/834, loss: 0.33828, lr: 1.101997, top1: 0.57396, throughput: 310.97 | 2022-04-03 09:02:36.209 [rank:3] [train], epoch: 17/50, iter: 800/834, loss: 0.34123, lr: 1.096777, top1: 0.57198, throughput: 314.50 | 2022-04-03 09:03:37.315 [rank:5] [train], epoch: 17/50, iter: 800/834, loss: 0.33740, lr: 1.096777, top1: 0.58281, throughput: 314.10 | 2022-04-03 09:03:37.327 [rank:1] [train], epoch: 17/50, iter: 800/834, loss: 0.34119, lr: 1.096777, top1: 0.57542, throughput: 314.26 | 2022-04-03 09:03:37.341 [rank:6] [train], epoch: 17/50, iter: 800/834, loss: 0.33902, lr: 1.096777, top1: 0.57885, throughput: 313.98 | 2022-04-03 09:03:37.340 [rank:7] [train], epoch: 17/50, iter: 800/834, loss: 0.33989, lr: 1.096777, top1: 0.57927, throughput: 314.06 | 2022-04-03 09:03:37.343 [rank:4] [train], epoch: 17/50, iter: 800/834, loss: 0.33791, lr: 1.096777, top1: 0.57729, throughput: 314.20 | 2022-04-03 09:03:37.354 [rank:2] [train], epoch: 17/50, iter: 800/834, loss: 0.34238, lr: 1.096777, top1: 0.57120, throughput: 313.80 | 2022-04-03 09:03:37.355 [rank:0] [train], epoch: 17/50, iter: 800/834, loss: 0.34123, lr: 1.096777, top1: 0.57167, throughput: 313.81 | 2022-04-03 09:03:37.391 [rank:1] [train], epoch: 17/50, iter: 834/834, loss: 0.33571, lr: 1.094998, top1: 0.57353, throughput: 311.61 | 2022-04-03 09:03:58.290 [rank:0] [train], epoch: 17/50, iter: 834/834, loss: 0.34440, lr: 1.094998, top1: 0.56801, throughput: 312.32 | 2022-04-03 09:03:58.293 [rank:5] [train], epoch: 17/50, iter: 834/834, loss: 0.34528, lr: 1.094998, top1: 0.56480, throughput: 311.22 | 2022-04-03 09:03:58.303 [rank:7] [train], epoch: 17/50, iter: 834/834, loss: 0.33918, lr: 1.094998, top1: 0.57858, throughput: 311.36 | 2022-04-03 09:03:58.309 [rank:4] [train], epoch: 17/50, iter: 834/834, loss: 0.34219, lr: 1.094998, top1: 0.57261, throughput: 311.45 | 2022-04-03 09:03:58.314 [rank:2] [train], epoch: 17/50, iter: 834/834, loss: 0.34181, lr: 1.094998, top1: 0.56648, throughput: 311.45 | 2022-04-03 09:03:58.315 [rank:6] [train], epoch: 17/50, iter: 834/834, loss: 0.33821, lr: 1.094998, top1: 0.58379, throughput: 311.22 | 2022-04-03 09:03:58.316 [rank:3] [train], epoch: 17/50, iter: 834/834, loss: 0.33882, lr: 1.094998, top1: 0.57292, throughput: 310.79 | 2022-04-03 09:03:58.320 [rank:0] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58256, throughput: 488.29 | 2022-04-03 09:04:11.093 [rank:2] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58064, throughput: 488.91 | 2022-04-03 09:04:11.098 [rank:1] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58480, throughput: 487.93 | 2022-04-03 09:04:11.099 [rank:3] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.57472, throughput: 488.82 | 2022-04-03 09:04:11.106 [rank:7] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.57136, throughput: 488.17 | 2022-04-03 09:04:11.111 [rank:4] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58416, throughput: 488.30 | 2022-04-03 09:04:11.113 [rank:6] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.57968, throughput: 487.98 | 2022-04-03 09:04:11.124 [rank:5] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.57312, throughput: 486.70 | 2022-04-03 09:04:11.144 [rank:4] [train], epoch: 18/50, iter: 100/834, loss: 0.33588, lr: 1.089754, top1: 0.58208, throughput: 313.02 | 2022-04-03 09:05:12.452 [rank:5] [train], epoch: 18/50, iter: 100/834, loss: 0.33475, lr: 1.089754, top1: 0.58693, throughput: 312.93 | 2022-04-03 09:05:12.500 [rank:7] [train], epoch: 18/50, iter: 100/834, loss: 0.33442, lr: 1.089754, top1: 0.58318, throughput: 312.74 | 2022-04-03 09:05:12.504 [rank:2] [train], epoch: 18/50, iter: 100/834, loss: 0.33383, lr: 1.089754, top1: 0.58521, throughput: 312.64 | 2022-04-03 09:05:12.511 [rank:0] [train], epoch: 18/50, iter: 100/834, loss: 0.33531, lr: 1.089754, top1: 0.58401, throughput: 312.52 | 2022-04-03 09:05:12.528 [rank:1] [train], epoch: 18/50, iter: 100/834, loss: 0.33534, lr: 1.089754, top1: 0.58661, throughput: 312.49 | 2022-04-03 09:05:12.540 [rank:6] [train], epoch: 18/50, iter: 100/834, loss: 0.33222, lr: 1.089754, top1: 0.59219, throughput: 312.61 | 2022-04-03 09:05:12.542 [rank:3] [train], epoch: 18/50, iter: 100/834, loss: 0.32891, lr: 1.089754, top1: 0.59568, throughput: 312.41 | 2022-04-03 09:05:12.564 [rank:6] [train], epoch: 18/50, iter: 200/834, loss: 0.33277, lr: 1.084491, top1: 0.58719, throughput: 312.75 | 2022-04-03 09:06:13.934 [rank:7] [train], epoch: 18/50, iter: 200/834, loss: 0.33301, lr: 1.084491, top1: 0.58781, throughput: 312.51 | 2022-04-03 09:06:13.941 [rank:5] [train], epoch: 18/50, iter: 200/834, loss: 0.33668, lr: 1.084491, top1: 0.57896, throughput: 312.43 | 2022-04-03 09:06:13.953 [rank:1] [train], epoch: 18/50, iter: 200/834, loss: 0.33654, lr: 1.084491, top1: 0.58432, throughput: 312.53 | 2022-04-03 09:06:13.974 [rank:2] [train], epoch: 18/50, iter: 200/834, loss: 0.33676, lr: 1.084491, top1: 0.58297, throughput: 312.27 | 2022-04-03 09:06:13.996 [rank:0] [train], epoch: 18/50, iter: 200/834, loss: 0.33746, lr: 1.084491, top1: 0.57964, throughput: 312.35 | 2022-04-03 09:06:13.997 [rank:4] [train], epoch: 18/50, iter: 200/834, loss: 0.33641, lr: 1.084491, top1: 0.58495, throughput: 311.90 | 2022-04-03 09:06:14.010 [rank:3] [train], epoch: 18/50, iter: 200/834, loss: 0.33268, lr: 1.084491, top1: 0.58771, throughput: 312.95 | 2022-04-03 09:06:13.917 [rank:5] [train], epoch: 18/50, iter: 300/834, loss: 0.33216, lr: 1.079210, top1: 0.58927, throughput: 313.61 | 2022-04-03 09:07:15.176 [rank:4] [train], epoch: 18/50, iter: 300/834, loss: 0.33441, lr: 1.079210, top1: 0.58479, throughput: 313.67 | 2022-04-03 09:07:15.222 [rank:3] [train], epoch: 18/50, iter: 300/834, loss: 0.33601, lr: 1.079210, top1: 0.58375, throughput: 313.13 | 2022-04-03 09:07:15.233 [rank:1] [train], epoch: 18/50, iter: 300/834, loss: 0.33733, lr: 1.079210, top1: 0.58182, throughput: 313.42 | 2022-04-03 09:07:15.234 [rank:2] [train], epoch: 18/50, iter: 300/834, loss: 0.33643, lr: 1.079210, top1: 0.58214, throughput: 313.49 | 2022-04-03 09:07:15.241 [rank:0] [train], epoch: 18/50, iter: 300/834, loss: 0.33716, lr: 1.079210, top1: 0.58000, throughput: 313.40 | 2022-04-03 09:07:15.260 [rank:6] [train], epoch: 18/50, iter: 300/834, loss: 0.33547, lr: 1.079210, top1: 0.58589, throughput: 313.40 | 2022-04-03 09:07:15.198 [rank:7] [train], epoch: 18/50, iter: 300/834, loss: 0.33682, lr: 1.079210, top1: 0.58271, throughput: 313.41 | 2022-04-03 09:07:15.202 [rank:3] [train], epoch: 18/50, iter: 400/834, loss: 0.33504, lr: 1.073912, top1: 0.58635, throughput: 312.82 | 2022-04-03 09:08:16.609 [rank:4] [train], epoch: 18/50, iter: 400/834, loss: 0.33374, lr: 1.073912, top1: 0.58823, throughput: 312.76 | 2022-04-03 09:08:16.610 [rank:2] [train], epoch: 18/50, iter: 400/834, loss: 0.33461, lr: 1.073912, top1: 0.57891, throughput: 312.80 | 2022-04-03 09:08:16.623 [rank:6] [train], epoch: 18/50, iter: 400/834, loss: 0.33469, lr: 1.073912, top1: 0.58604, throughput: 312.54 | 2022-04-03 09:08:16.629 [rank:0] [train], epoch: 18/50, iter: 400/834, loss: 0.33688, lr: 1.073912, top1: 0.57964, throughput: 312.76 | 2022-04-03 09:08:16.649 [rank:1] [train], epoch: 18/50, iter: 400/834, loss: 0.33974, lr: 1.073912, top1: 0.57583, throughput: 312.59 | 2022-04-03 09:08:16.655 [rank:5] [train], epoch: 18/50, iter: 400/834, loss: 0.33659, lr: 1.073912, top1: 0.58224, throughput: 312.68 | 2022-04-03 09:08:16.580 [rank:7] [train], epoch: 18/50, iter: 400/834, loss: 0.33893, lr: 1.073912, top1: 0.57740, throughput: 312.21 | 2022-04-03 09:08:16.698 [rank:5] [train], epoch: 18/50, iter: 500/834, loss: 0.33688, lr: 1.068596, top1: 0.58276, throughput: 313.54 | 2022-04-03 09:09:17.816 [rank:7] [train], epoch: 18/50, iter: 500/834, loss: 0.33763, lr: 1.068596, top1: 0.57682, throughput: 313.90 | 2022-04-03 09:09:17.864 [rank:3] [train], epoch: 18/50, iter: 500/834, loss: 0.33620, lr: 1.068596, top1: 0.57557, throughput: 313.42 | 2022-04-03 09:09:17.869 [rank:2] [train], epoch: 18/50, iter: 500/834, loss: 0.33623, lr: 1.068596, top1: 0.58427, throughput: 313.44 | 2022-04-03 09:09:17.879 [rank:0] [train], epoch: 18/50, iter: 500/834, loss: 0.33871, lr: 1.068596, top1: 0.58031, throughput: 313.53 | 2022-04-03 09:09:17.886 [rank:4] [train], epoch: 18/50, iter: 500/834, loss: 0.33971, lr: 1.068596, top1: 0.57479, throughput: 313.33 | 2022-04-03 09:09:17.888 [rank:6] [train], epoch: 18/50, iter: 500/834, loss: 0.33801, lr: 1.068596, top1: 0.57755, throughput: 313.33 | 2022-04-03 09:09:17.905 [rank:1] [train], epoch: 18/50, iter: 500/834, loss: 0.33533, lr: 1.068596, top1: 0.58219, throughput: 313.85 | 2022-04-03 09:09:17.831 [rank:3] [train], epoch: 18/50, iter: 600/834, loss: 0.33806, lr: 1.063263, top1: 0.58120, throughput: 312.56 | 2022-04-03 09:10:19.296 [rank:0] [train], epoch: 18/50, iter: 600/834, loss: 0.33496, lr: 1.063263, top1: 0.58411, throughput: 312.59 | 2022-04-03 09:10:19.308 [rank:1] [train], epoch: 18/50, iter: 600/834, loss: 0.33682, lr: 1.063263, top1: 0.58438, throughput: 312.23 | 2022-04-03 09:10:19.324 [rank:5] [train], epoch: 18/50, iter: 600/834, loss: 0.33661, lr: 1.063263, top1: 0.58104, throughput: 312.10 | 2022-04-03 09:10:19.335 [rank:4] [train], epoch: 18/50, iter: 600/834, loss: 0.33807, lr: 1.063263, top1: 0.58151, throughput: 312.39 | 2022-04-03 09:10:19.350 [rank:2] [train], epoch: 18/50, iter: 600/834, loss: 0.33403, lr: 1.063263, top1: 0.58703, throughput: 312.33 | 2022-04-03 09:10:19.353 [rank:6] [train], epoch: 18/50, iter: 600/834, loss: 0.33904, lr: 1.063263, top1: 0.57307, throughput: 312.44 | 2022-04-03 09:10:19.358 [rank:7] [train], epoch: 18/50, iter: 600/834, loss: 0.33706, lr: 1.063263, top1: 0.58094, throughput: 312.22 | 2022-04-03 09:10:19.359 [rank:3] [train], epoch: 18/50, iter: 700/834, loss: 0.33636, lr: 1.057914, top1: 0.57979, throughput: 312.16 | 2022-04-03 09:11:20.804 [rank:1] [train], epoch: 18/50, iter: 700/834, loss: 0.33597, lr: 1.057914, top1: 0.58323, throughput: 312.23 | 2022-04-03 09:11:20.818 [rank:7] [train], epoch: 18/50, iter: 700/834, loss: 0.33981, lr: 1.057914, top1: 0.57781, throughput: 312.36 | 2022-04-03 09:11:20.826 [rank:6] [train], epoch: 18/50, iter: 700/834, loss: 0.33781, lr: 1.057914, top1: 0.58125, throughput: 312.35 | 2022-04-03 09:11:20.826 [rank:5] [train], epoch: 18/50, iter: 700/834, loss: 0.33995, lr: 1.057914, top1: 0.57714, throughput: 312.19 | 2022-04-03 09:11:20.836 [rank:0] [train], epoch: 18/50, iter: 700/834, loss: 0.33654, lr: 1.057914, top1: 0.58063, throughput: 311.99 | 2022-04-03 09:11:20.849 [rank:4] [train], epoch: 18/50, iter: 700/834, loss: 0.33740, lr: 1.057914, top1: 0.57922, throughput: 312.05 | 2022-04-03 09:11:20.878 [rank:2] [train], epoch: 18/50, iter: 700/834, loss: 0.33768, lr: 1.057914, top1: 0.58224, throughput: 312.49 | 2022-04-03 09:11:20.795 [rank:1] [train], epoch: 18/50, iter: 800/834, loss: 0.33831, lr: 1.052548, top1: 0.57917, throughput: 313.89 | 2022-04-03 09:12:21.985 [rank:5] [train], epoch: 18/50, iter: 800/834, loss: 0.33835, lr: 1.052548, top1: 0.58240, throughput: 313.92 | 2022-04-03 09:12:21.997 [rank:3] [train], epoch: 18/50, iter: 800/834, loss: 0.33627, lr: 1.052548, top1: 0.58234, throughput: 313.75 | 2022-04-03 09:12:21.998 [rank:0] [train], epoch: 18/50, iter: 800/834, loss: 0.33742, lr: 1.052548, top1: 0.57995, throughput: 313.83 | 2022-04-03 09:12:22.028 [rank:7] [train], epoch: 18/50, iter: 800/834, loss: 0.33701, lr: 1.052548, top1: 0.58281, throughput: 313.71 | 2022-04-03 09:12:22.030 [rank:2] [train], epoch: 18/50, iter: 800/834, loss: 0.34055, lr: 1.052548, top1: 0.57323, throughput: 313.48 | 2022-04-03 09:12:22.042 [rank:4] [train], epoch: 18/50, iter: 800/834, loss: 0.33686, lr: 1.052548, top1: 0.57885, throughput: 313.90 | 2022-04-03 09:12:22.043 [rank:6] [train], epoch: 18/50, iter: 800/834, loss: 0.33764, lr: 1.052548, top1: 0.58099, throughput: 313.59 | 2022-04-03 09:12:22.053 [rank:3] [train], epoch: 18/50, iter: 834/834, loss: 0.33658, lr: 1.050720, top1: 0.57950, throughput: 311.96 | 2022-04-03 09:12:42.923 [rank:5] [train], epoch: 18/50, iter: 834/834, loss: 0.33620, lr: 1.050720, top1: 0.57613, throughput: 311.88 | 2022-04-03 09:12:42.929 [rank:6] [train], epoch: 18/50, iter: 834/834, loss: 0.33512, lr: 1.050720, top1: 0.58471, throughput: 312.65 | 2022-04-03 09:12:42.932 [rank:1] [train], epoch: 18/50, iter: 834/834, loss: 0.33519, lr: 1.050720, top1: 0.58150, throughput: 311.63 | 2022-04-03 09:12:42.933 [rank:7] [train], epoch: 18/50, iter: 834/834, loss: 0.33717, lr: 1.050720, top1: 0.57644, throughput: 312.29 | 2022-04-03 09:12:42.934 [rank:0] [train], epoch: 18/50, iter: 834/834, loss: 0.33391, lr: 1.050720, top1: 0.58441, throughput: 312.11 | 2022-04-03 09:12:42.943 [rank:4] [train], epoch: 18/50, iter: 834/834, loss: 0.34193, lr: 1.050720, top1: 0.56924, throughput: 312.00 | 2022-04-03 09:12:42.966 [rank:2] [train], epoch: 18/50, iter: 834/834, loss: 0.33457, lr: 1.050720, top1: 0.58149, throughput: 311.82 | 2022-04-03 09:12:42.977 [rank:0] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.57712, throughput: 489.72 | 2022-04-03 09:12:55.706 [rank:2] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.57312, throughput: 491.01 | 2022-04-03 09:12:55.706 [rank:7] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.56432, throughput: 488.95 | 2022-04-03 09:12:55.716 [rank:6] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.56752, throughput: 488.50 | 2022-04-03 09:12:55.726 [rank:3] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.56032, throughput: 488.13 | 2022-04-03 09:12:55.727 [rank:4] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.57504, throughput: 489.69 | 2022-04-03 09:12:55.730 [rank:1] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.57264, throughput: 488.39 | 2022-04-03 09:12:55.730 [rank:5] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.56272, throughput: 487.23 | 2022-04-03 09:12:55.756 [rank:3] [train], epoch: 19/50, iter: 100/834, loss: 0.33297, lr: 1.045332, top1: 0.58906, throughput: 312.63 | 2022-04-03 09:13:57.141 [rank:7] [train], epoch: 19/50, iter: 100/834, loss: 0.33284, lr: 1.045332, top1: 0.58958, throughput: 312.53 | 2022-04-03 09:13:57.150 [rank:5] [train], epoch: 19/50, iter: 100/834, loss: 0.33199, lr: 1.045332, top1: 0.58714, throughput: 312.73 | 2022-04-03 09:13:57.151 [rank:0] [train], epoch: 19/50, iter: 100/834, loss: 0.32891, lr: 1.045332, top1: 0.59677, throughput: 312.46 | 2022-04-03 09:13:57.154 [rank:6] [train], epoch: 19/50, iter: 100/834, loss: 0.33268, lr: 1.045332, top1: 0.58719, throughput: 312.52 | 2022-04-03 09:13:57.163 [rank:1] [train], epoch: 19/50, iter: 100/834, loss: 0.32743, lr: 1.045332, top1: 0.60156, throughput: 312.54 | 2022-04-03 09:13:57.162 [rank:2] [train], epoch: 19/50, iter: 100/834, loss: 0.33006, lr: 1.045332, top1: 0.59130, throughput: 312.36 | 2022-04-03 09:13:57.175 [rank:4] [train], epoch: 19/50, iter: 100/834, loss: 0.32983, lr: 1.045332, top1: 0.59208, throughput: 312.39 | 2022-04-03 09:13:57.192 [rank:6] [train], epoch: 19/50, iter: 200/834, loss: 0.33169, lr: 1.039929, top1: 0.58932, throughput: 311.28 | 2022-04-03 09:14:58.844 [rank:3] [train], epoch: 19/50, iter: 200/834, loss: 0.33205, lr: 1.039929, top1: 0.58917, throughput: 311.12 | 2022-04-03 09:14:58.853 [rank:1] [train], epoch: 19/50, iter: 200/834, loss: 0.33110, lr: 1.039929, top1: 0.59125, throughput: 311.22 | 2022-04-03 09:14:58.856 [rank:7] [train], epoch: 19/50, iter: 200/834, loss: 0.32956, lr: 1.039929, top1: 0.59188, throughput: 311.08 | 2022-04-03 09:14:58.870 [rank:2] [train], epoch: 19/50, iter: 200/834, loss: 0.33529, lr: 1.039929, top1: 0.58484, throughput: 311.17 | 2022-04-03 09:14:58.877 [rank:5] [train], epoch: 19/50, iter: 200/834, loss: 0.33342, lr: 1.039929, top1: 0.58932, throughput: 311.05 | 2022-04-03 09:14:58.878 [rank:4] [train], epoch: 19/50, iter: 200/834, loss: 0.33345, lr: 1.039929, top1: 0.58307, throughput: 311.23 | 2022-04-03 09:14:58.882 [rank:0] [train], epoch: 19/50, iter: 200/834, loss: 0.32950, lr: 1.039929, top1: 0.59766, throughput: 310.90 | 2022-04-03 09:14:58.910 [rank:3] [train], epoch: 19/50, iter: 300/834, loss: 0.33126, lr: 1.034510, top1: 0.59099, throughput: 313.84 | 2022-04-03 09:16:00.032 [rank:5] [train], epoch: 19/50, iter: 300/834, loss: 0.33522, lr: 1.034510, top1: 0.57979, throughput: 313.86 | 2022-04-03 09:16:00.051 [rank:6] [train], epoch: 19/50, iter: 300/834, loss: 0.33208, lr: 1.034510, top1: 0.59073, throughput: 313.57 | 2022-04-03 09:16:00.073 [rank:4] [train], epoch: 19/50, iter: 300/834, loss: 0.33124, lr: 1.034510, top1: 0.59255, throughput: 313.75 | 2022-04-03 09:16:00.078 [rank:0] [train], epoch: 19/50, iter: 300/834, loss: 0.33344, lr: 1.034510, top1: 0.58870, throughput: 313.80 | 2022-04-03 09:16:00.095 [rank:1] [train], epoch: 19/50, iter: 300/834, loss: 0.33147, lr: 1.034510, top1: 0.59099, throughput: 313.49 | 2022-04-03 09:16:00.102 [rank:7] [train], epoch: 19/50, iter: 300/834, loss: 0.33109, lr: 1.034510, top1: 0.59422, throughput: 313.97 | 2022-04-03 09:16:00.022 [rank:2] [train], epoch: 19/50, iter: 300/834, loss: 0.33515, lr: 1.034510, top1: 0.58104, throughput: 313.51 | 2022-04-03 09:16:00.120 [rank:2] [train], epoch: 19/50, iter: 400/834, loss: 0.33478, lr: 1.029076, top1: 0.58427, throughput: 311.39 | 2022-04-03 09:17:01.779 [rank:1] [train], epoch: 19/50, iter: 400/834, loss: 0.33503, lr: 1.029076, top1: 0.58203, throughput: 311.15 | 2022-04-03 09:17:01.809 [rank:6] [train], epoch: 19/50, iter: 400/834, loss: 0.33038, lr: 1.029076, top1: 0.59568, throughput: 310.91 | 2022-04-03 09:17:01.828 [rank:7] [train], epoch: 19/50, iter: 400/834, loss: 0.33423, lr: 1.029076, top1: 0.58219, throughput: 310.61 | 2022-04-03 09:17:01.836 [rank:4] [train], epoch: 19/50, iter: 400/834, loss: 0.33304, lr: 1.029076, top1: 0.58990, throughput: 310.81 | 2022-04-03 09:17:01.853 [rank:5] [train], epoch: 19/50, iter: 400/834, loss: 0.33334, lr: 1.029076, top1: 0.58380, throughput: 310.63 | 2022-04-03 09:17:01.860 [rank:0] [train], epoch: 19/50, iter: 400/834, loss: 0.33216, lr: 1.029076, top1: 0.59130, throughput: 310.79 | 2022-04-03 09:17:01.874 [rank:3] [train], epoch: 19/50, iter: 400/834, loss: 0.33191, lr: 1.029076, top1: 0.59292, throughput: 310.94 | 2022-04-03 09:17:01.780 [rank:2] [train], epoch: 19/50, iter: 500/834, loss: 0.33086, lr: 1.023627, top1: 0.59286, throughput: 312.84 | 2022-04-03 09:18:03.153 [rank:6] [train], epoch: 19/50, iter: 500/834, loss: 0.33364, lr: 1.023627, top1: 0.58349, throughput: 312.92 | 2022-04-03 09:18:03.185 [rank:7] [train], epoch: 19/50, iter: 500/834, loss: 0.33534, lr: 1.023627, top1: 0.58552, throughput: 312.95 | 2022-04-03 09:18:03.188 [rank:0] [train], epoch: 19/50, iter: 500/834, loss: 0.33240, lr: 1.023627, top1: 0.59089, throughput: 313.13 | 2022-04-03 09:18:03.190 [rank:3] [train], epoch: 19/50, iter: 500/834, loss: 0.33478, lr: 1.023627, top1: 0.58641, throughput: 312.57 | 2022-04-03 09:18:03.207 [rank:5] [train], epoch: 19/50, iter: 500/834, loss: 0.33376, lr: 1.023627, top1: 0.58885, throughput: 312.89 | 2022-04-03 09:18:03.223 [rank:4] [train], epoch: 19/50, iter: 500/834, loss: 0.33259, lr: 1.023627, top1: 0.59031, throughput: 312.82 | 2022-04-03 09:18:03.229 [rank:1] [train], epoch: 19/50, iter: 500/834, loss: 0.33626, lr: 1.023627, top1: 0.58016, throughput: 312.39 | 2022-04-03 09:18:03.271 [rank:4] [train], epoch: 19/50, iter: 600/834, loss: 0.33218, lr: 1.018164, top1: 0.58734, throughput: 313.57 | 2022-04-03 09:19:04.459 [rank:7] [train], epoch: 19/50, iter: 600/834, loss: 0.33178, lr: 1.018164, top1: 0.58818, throughput: 313.13 | 2022-04-03 09:19:04.504 [rank:6] [train], epoch: 19/50, iter: 600/834, loss: 0.33401, lr: 1.018164, top1: 0.58688, throughput: 312.98 | 2022-04-03 09:19:04.530 [rank:2] [train], epoch: 19/50, iter: 600/834, loss: 0.33499, lr: 1.018164, top1: 0.58729, throughput: 312.76 | 2022-04-03 09:19:04.542 [rank:3] [train], epoch: 19/50, iter: 600/834, loss: 0.33631, lr: 1.018164, top1: 0.57859, throughput: 313.03 | 2022-04-03 09:19:04.543 [rank:5] [train], epoch: 19/50, iter: 600/834, loss: 0.33506, lr: 1.018164, top1: 0.58229, throughput: 313.10 | 2022-04-03 09:19:04.545 [rank:1] [train], epoch: 19/50, iter: 600/834, loss: 0.33626, lr: 1.018164, top1: 0.58109, throughput: 313.23 | 2022-04-03 09:19:04.569 [rank:0] [train], epoch: 19/50, iter: 600/834, loss: 0.33329, lr: 1.018164, top1: 0.58667, throughput: 313.20 | 2022-04-03 09:19:04.493 [rank:5] [train], epoch: 19/50, iter: 700/834, loss: 0.33418, lr: 1.012687, top1: 0.59016, throughput: 313.05 | 2022-04-03 09:20:05.877 [rank:1] [train], epoch: 19/50, iter: 700/834, loss: 0.33311, lr: 1.012687, top1: 0.58979, throughput: 313.15 | 2022-04-03 09:20:05.881 [rank:3] [train], epoch: 19/50, iter: 700/834, loss: 0.33495, lr: 1.012687, top1: 0.58479, throughput: 312.94 | 2022-04-03 09:20:05.896 [rank:6] [train], epoch: 19/50, iter: 700/834, loss: 0.33530, lr: 1.012687, top1: 0.58432, throughput: 312.82 | 2022-04-03 09:20:05.908 [rank:2] [train], epoch: 19/50, iter: 700/834, loss: 0.33225, lr: 1.012687, top1: 0.59068, throughput: 312.83 | 2022-04-03 09:20:05.917 [rank:0] [train], epoch: 19/50, iter: 700/834, loss: 0.33713, lr: 1.012687, top1: 0.58312, throughput: 312.54 | 2022-04-03 09:20:05.924 [rank:7] [train], epoch: 19/50, iter: 700/834, loss: 0.33456, lr: 1.012687, top1: 0.58120, throughput: 312.49 | 2022-04-03 09:20:05.946 [rank:4] [train], epoch: 19/50, iter: 700/834, loss: 0.33347, lr: 1.012687, top1: 0.58703, throughput: 312.23 | 2022-04-03 09:20:05.953 [rank:5] [train], epoch: 19/50, iter: 800/834, loss: 0.33221, lr: 1.007195, top1: 0.58656, throughput: 315.04 | 2022-04-03 09:21:06.822 [rank:3] [train], epoch: 19/50, iter: 800/834, loss: 0.33407, lr: 1.007195, top1: 0.58547, throughput: 315.11 | 2022-04-03 09:21:06.827 [rank:1] [train], epoch: 19/50, iter: 800/834, loss: 0.33401, lr: 1.007195, top1: 0.59036, throughput: 314.95 | 2022-04-03 09:21:06.843 [rank:0] [train], epoch: 19/50, iter: 800/834, loss: 0.33530, lr: 1.007195, top1: 0.58156, throughput: 315.14 | 2022-04-03 09:21:06.849 [rank:4] [train], epoch: 19/50, iter: 800/834, loss: 0.33472, lr: 1.007195, top1: 0.58276, throughput: 315.27 | 2022-04-03 09:21:06.854 [rank:2] [train], epoch: 19/50, iter: 800/834, loss: 0.33607, lr: 1.007195, top1: 0.58068, throughput: 314.95 | 2022-04-03 09:21:06.880 [rank:7] [train], epoch: 19/50, iter: 800/834, loss: 0.33234, lr: 1.007195, top1: 0.58714, throughput: 315.05 | 2022-04-03 09:21:06.888 [rank:6] [train], epoch: 19/50, iter: 800/834, loss: 0.33280, lr: 1.007195, top1: 0.58932, throughput: 314.81 | 2022-04-03 09:21:06.897 [rank:5] [train], epoch: 19/50, iter: 834/834, loss: 0.33364, lr: 1.005325, top1: 0.58318, throughput: 310.83 | 2022-04-03 09:21:27.824 [rank:2] [train], epoch: 19/50, iter: 834/834, loss: 0.32982, lr: 1.005325, top1: 0.60064, throughput: 310.94 | 2022-04-03 09:21:27.874 [rank:3] [train], epoch: 19/50, iter: 834/834, loss: 0.33865, lr: 1.005325, top1: 0.58180, throughput: 310.01[rank:7] [train], epoch: 19/50, iter: 834/834, loss: 0.33195, lr: 1.005325, top1: 0.58195, throughput: 310.91 | 2022-04-03 09:21:27.884 | 2022-04-03 09:21:27.884 [rank:0] [train], epoch: 19/50, iter: 834/834, loss: 0.33112, lr: 1.005325, top1: 0.59222, throughput: 310.26 | 2022-04-03 09:21:27.889 [rank:4] [train], epoch: 19/50, iter: 834/834, loss: 0.33565, lr: 1.005325, top1: 0.58624, throughput: 310.27 | 2022-04-03 09:21:27.893 [rank:6] [train], epoch: 19/50, iter: 834/834, loss: 0.33349, lr: 1.005325, top1: 0.58578, throughput: 310.71 | 2022-04-03 09:21:27.907 [rank:1] [train], epoch: 19/50, iter: 834/834, loss: 0.33482, lr: 1.005325, top1: 0.58624, throughput: 309.76 | 2022-04-03 09:21:27.918 [rank:0] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.55328, throughput: 491.85 | 2022-04-03 09:21:40.596 [rank:2] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.54688, throughput: 490.95 | 2022-04-03 09:21:40.604 [rank:1] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.54576, throughput: 492.62 | 2022-04-03 09:21:40.605 [rank:6] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.54512, throughput: 491.78 | 2022-04-03 09:21:40.616 [rank:4] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.54224, throughput: 491.24 | 2022-04-03 09:21:40.616 [rank:7] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.54288, throughput: 490.78 | 2022-04-03 09:21:40.619 [rank:3] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.53728, throughput: 490.52 | 2022-04-03 09:21:40.626 [rank:5] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.53376, throughput: 487.50 | 2022-04-03 09:21:40.645 [rank:6] [train], epoch: 20/50, iter: 100/834, loss: 0.32576, lr: 0.999816, top1: 0.60505, throughput: 313.22 | 2022-04-03 09:22:41.916 [rank:5] [train], epoch: 20/50, iter: 100/834, loss: 0.32864, lr: 0.999816, top1: 0.60094, throughput: 313.14 | 2022-04-03 09:22:41.960 [rank:3] [train], epoch: 20/50, iter: 100/834, loss: 0.32649, lr: 0.999816, top1: 0.59958, throughput: 313.01 | 2022-04-03 09:22:41.967 [rank:2] [train], epoch: 20/50, iter: 100/834, loss: 0.32537, lr: 0.999816, top1: 0.60245, throughput: 312.76 | 2022-04-03 09:22:41.993 [rank:1] [train], epoch: 20/50, iter: 100/834, loss: 0.32878, lr: 0.999816, top1: 0.59349, throughput: 312.74 | 2022-04-03 09:22:41.998 [rank:0] [train], epoch: 20/50, iter: 100/834, loss: 0.32626, lr: 0.999816, top1: 0.60052, throughput: 312.55 | 2022-04-03 09:22:42.026 [rank:7] [train], epoch: 20/50, iter: 100/834, loss: 0.32736, lr: 0.999816, top1: 0.59885, throughput: 312.49 | 2022-04-03 09:22:42.060 [rank:4] [train], epoch: 20/50, iter: 100/834, loss: 0.32762, lr: 0.999816, top1: 0.59474, throughput: 312.48 | 2022-04-03 09:22:42.060 [rank:7] [train], epoch: 20/50, iter: 200/834, loss: 0.32564, lr: 0.994293, top1: 0.60307, throughput: 313.32 | 2022-04-03 09:23:43.339 [rank:6] [train], epoch: 20/50, iter: 200/834, loss: 0.32943, lr: 0.994293, top1: 0.59401, throughput: 312.52 | 2022-04-03 09:23:43.353 [rank:3] [train], epoch: 20/50, iter: 200/834, loss: 0.33171, lr: 0.994293, top1: 0.58703, throughput: 312.70 | 2022-04-03 09:23:43.368 [rank:0] [train], epoch: 20/50, iter: 200/834, loss: 0.32905, lr: 0.994293, top1: 0.59432, throughput: 313.00 | 2022-04-03 09:23:43.368 [rank:2] [train], epoch: 20/50, iter: 200/834, loss: 0.32588, lr: 0.994293, top1: 0.60234, throughput: 312.79 | 2022-04-03 09:23:43.377 [rank:1] [train], epoch: 20/50, iter: 200/834, loss: 0.32867, lr: 0.994293, top1: 0.59729, throughput: 312.79 | 2022-04-03 09:23:43.380 [rank:5] [train], epoch: 20/50, iter: 200/834, loss: 0.32947, lr: 0.994293, top1: 0.59672, throughput: 312.57 | 2022-04-03 09:23:43.385 [rank:4] [train], epoch: 20/50, iter: 200/834, loss: 0.32833, lr: 0.994293, top1: 0.59734, throughput: 312.90 | 2022-04-03 09:23:43.423 [rank:2] [train], epoch: 20/50, iter: 300/834, loss: 0.32851, lr: 0.988758, top1: 0.59573, throughput: 312.47 | 2022-04-03 09:24:44.824 [rank:0] [train], epoch: 20/50, iter: 300/834, loss: 0.33157, lr: 0.988758, top1: 0.59094, throughput: 312.33 | 2022-04-03 09:24:44.841 [rank:4] [train], epoch: 20/50, iter: 300/834, loss: 0.33198, lr: 0.988758, top1: 0.58865, throughput: 312.52 | 2022-04-03 09:24:44.859 [rank:3] [train], epoch: 20/50, iter: 300/834, loss: 0.33038, lr: 0.988758, top1: 0.59229, throughput: 312.23 | 2022-04-03 09:24:44.861 [rank:1] [train], epoch: 20/50, iter: 300/834, loss: 0.32716, lr: 0.988758, top1: 0.60130, throughput: 312.21 | 2022-04-03 09:24:44.877 [rank:5] [train], epoch: 20/50, iter: 300/834, loss: 0.33121, lr: 0.988758, top1: 0.59120, throughput: 312.23 | 2022-04-03 09:24:44.878 [rank:6] [train], epoch: 20/50, iter: 300/834, loss: 0.33159, lr: 0.988758, top1: 0.59297, throughput: 312.03 | 2022-04-03 09:24:44.884 [rank:7] [train], epoch: 20/50, iter: 300/834, loss: 0.33088, lr: 0.988758, top1: 0.59198, throughput: 311.83 | 2022-04-03 09:24:44.911 [rank:5] [train], epoch: 20/50, iter: 400/834, loss: 0.33150, lr: 0.983210, top1: 0.58953, throughput: 313.37 | 2022-04-03 09:25:46.148 [rank:7] [train], epoch: 20/50, iter: 400/834, loss: 0.33239, lr: 0.983210, top1: 0.59047, throughput: 313.53 | 2022-04-03 09:25:46.148 [rank:3] [train], epoch: 20/50, iter: 400/834, loss: 0.32899, lr: 0.983210, top1: 0.59698, throughput: 313.08 | 2022-04-03 09:25:46.187 [rank:2] [train], epoch: 20/50, iter: 400/834, loss: 0.32986, lr: 0.983210, top1: 0.59495, throughput: 312.85 | 2022-04-03 09:25:46.195 [rank:4] [train], epoch: 20/50, iter: 400/834, loss: 0.32841, lr: 0.983210, top1: 0.59599, throughput: 313.02 | 2022-04-03 09:25:46.196 [rank:0] [train], epoch: 20/50, iter: 400/834, loss: 0.33125, lr: 0.983210, top1: 0.58844, throughput: 312.93 | 2022-04-03 09:25:46.196 [rank:1] [train], epoch: 20/50, iter: 400/834, loss: 0.32976, lr: 0.983210, top1: 0.59286, throughput: 313.03 | 2022-04-03 09:25:46.212 [rank:6] [train], epoch: 20/50, iter: 400/834, loss: 0.32796, lr: 0.983210, top1: 0.59484, throughput: 313.46 | 2022-04-03 09:25:46.137 [rank:2] [train], epoch: 20/50, iter: 500/834, loss: 0.32948, lr: 0.977649, top1: 0.59161, throughput: 313.42 | 2022-04-03 09:26:47.454 [rank:4] [train], epoch: 20/50, iter: 500/834, loss: 0.32945, lr: 0.977649, top1: 0.59562, throughput: 313.35 | 2022-04-03 09:26:47.470 [rank:3] [train], epoch: 20/50, iter: 500/834, loss: 0.33210, lr: 0.977649, top1: 0.58823, throughput: 313.21 | 2022-04-03 09:26:47.488 [rank:6] [train], epoch: 20/50, iter: 500/834, loss: 0.33135, lr: 0.977649, top1: 0.59500, throughput: 312.92 | 2022-04-03 09:26:47.495 [rank:0] [train], epoch: 20/50, iter: 500/834, loss: 0.33312, lr: 0.977649, top1: 0.58927, throughput: 313.21 | 2022-04-03 09:26:47.497 [rank:7] [train], epoch: 20/50, iter: 500/834, loss: 0.32958, lr: 0.977649, top1: 0.59740, throughput: 312.88 | 2022-04-03 09:26:47.514 [rank:1] [train], epoch: 20/50, iter: 500/834, loss: 0.32859, lr: 0.977649, top1: 0.59443, throughput: 313.63 | 2022-04-03 09:26:47.431 [rank:5] [train], epoch: 20/50, iter: 500/834, loss: 0.33015, lr: 0.977649, top1: 0.59437, throughput: 312.77 | 2022-04-03 09:26:47.534 [rank:1] [train], epoch: 20/50, iter: 600/834, loss: 0.33190, lr: 0.972077, top1: 0.58812, throughput: 312.96 | 2022-04-03 09:27:48.781 [rank:3] [train], epoch: 20/50, iter: 600/834, loss: 0.33180, lr: 0.972077, top1: 0.58995, throughput: 313.10 | 2022-04-03 09:27:48.811 [rank:5] [train], epoch: 20/50, iter: 600/834, loss: 0.33194, lr: 0.972077, top1: 0.58839, throughput: 313.28 | 2022-04-03 09:27:48.821 [rank:0] [train], epoch: 20/50, iter: 600/834, loss: 0.33196, lr: 0.972077, top1: 0.58870, throughput: 312.99 | 2022-04-03 09:27:48.840 [rank:2] [train], epoch: 20/50, iter: 600/834, loss: 0.33162, lr: 0.972077, top1: 0.59031, throughput: 312.69 | 2022-04-03 09:27:48.857 [rank:4] [train], epoch: 20/50, iter: 600/834, loss: 0.33066, lr: 0.972077, top1: 0.59464, throughput: 312.73 | 2022-04-03 09:27:48.865 [rank:6] [train], epoch: 20/50, iter: 600/834, loss: 0.33246, lr: 0.972077, top1: 0.59135, throughput: 312.86 | 2022-04-03 09:27:48.864 [rank:7] [train], epoch: 20/50, iter: 600/834, loss: 0.33156, lr: 0.972077, top1: 0.59031, throughput: 312.85 | 2022-04-03 09:27:48.886 [rank:6] [train], epoch: 20/50, iter: 700/834, loss: 0.33307, lr: 0.966494, top1: 0.58693, throughput: 313.32 | 2022-04-03 09:28:50.143 [rank:4] [train], epoch: 20/50, iter: 700/834, loss: 0.33193, lr: 0.966494, top1: 0.59083, throughput: 313.32 | 2022-04-03 09:28:50.145 [rank:1] [train], epoch: 20/50, iter: 700/834, loss: 0.33132, lr: 0.966494, top1: 0.59693, throughput: 312.85 | 2022-04-03 09:28:50.153 [rank:0] [train], epoch: 20/50, iter: 700/834, loss: 0.33177, lr: 0.966494, top1: 0.58693, throughput: 313.04 | 2022-04-03 09:28:50.174 [rank:2] [train], epoch: 20/50, iter: 700/834, loss: 0.33133, lr: 0.966494, top1: 0.59771, throughput: 313.12 | 2022-04-03 09:28:50.174 [rank:5] [train], epoch: 20/50, iter: 700/834, loss: 0.32941, lr: 0.966494, top1: 0.59568, throughput: 312.83 | 2022-04-03 09:28:50.196 [rank:3] [train], epoch: 20/50, iter: 700/834, loss: 0.32893, lr: 0.966494, top1: 0.59432, throughput: 312.74 | 2022-04-03 09:28:50.203 [rank:7] [train], epoch: 20/50, iter: 700/834, loss: 0.33026, lr: 0.966494, top1: 0.59161, throughput: 313.48 | 2022-04-03 09:28:50.134 [rank:1] [train], epoch: 20/50, iter: 800/834, loss: 0.33282, lr: 0.960899, top1: 0.58922, throughput: 312.69 | 2022-04-03 09:29:51.556 [rank:3] [train], epoch: 20/50, iter: 800/834, loss: 0.33263, lr: 0.960899, top1: 0.59078, throughput: 312.89 | 2022-04-03 09:29:51.566 [rank:0] [train], epoch: 20/50, iter: 800/834, loss: 0.32972, lr: 0.960899, top1: 0.59870, throughput: 312.71 | 2022-04-03 09:29:51.573 [rank:5] [train], epoch: 20/50, iter: 800/834, loss: 0.33332, lr: 0.960899, top1: 0.58260, throughput: 312.81 | 2022-04-03 09:29:51.575 [rank:6] [train], epoch: 20/50, iter: 800/834, loss: 0.33218, lr: 0.960899, top1: 0.58958, throughput: 312.50 | 2022-04-03 09:29:51.584 [rank:4] [train], epoch: 20/50, iter: 800/834, loss: 0.33028, lr: 0.960899, top1: 0.59437, throughput: 312.41 | 2022-04-03 09:29:51.603 [rank:2] [train], epoch: 20/50, iter: 800/834, loss: 0.33126, lr: 0.960899, top1: 0.59260, throughput: 312.49 | 2022-04-03 09:29:51.617 [rank:7] [train], epoch: 20/50, iter: 800/834, loss: 0.33281, lr: 0.960899, top1: 0.58776, throughput: 312.25 | 2022-04-03 09:29:51.623 [rank:3] [train], epoch: 20/50, iter: 834/834, loss: 0.33246, lr: 0.958994, top1: 0.58578, throughput: 315.12 | 2022-04-03 09:30:12.282 [rank:2] [train], epoch: 20/50, iter: 834/834, loss: 0.33387, lr: 0.958994, top1: 0.58425, throughput: 315.88 | 2022-04-03 09:30:12.283 [rank:5] [train], epoch: 20/50, iter: 834/834, loss: 0.32869, lr: 0.958994, top1: 0.59498, throughput: 315.22 | 2022-04-03 09:30:12.285 [rank:4] [train], epoch: 20/50, iter: 834/834, loss: 0.32991, lr: 0.958994, top1: 0.59023, throughput: 315.64 | 2022-04-03 09:30:12.285 [rank:6] [train], epoch: 20/50, iter: 834/834, loss: 0.33091, lr: 0.958994, top1: 0.58869, throughput: 315.26 | 2022-04-03 09:30:12.291 [rank:1] [train], epoch: 20/50, iter: 834/834, loss: 0.33101, lr: 0.958994, top1: 0.59145, throughput: 314.81 | 2022-04-03 09:30:12.292 [rank:7] [train], epoch: 20/50, iter: 834/834, loss: 0.33404, lr: 0.958994, top1: 0.58624, throughput: 315.77 | 2022-04-03 09:30:12.297 [rank:0] [train], epoch: 20/50, iter: 834/834, loss: 0.33126, lr: 0.958994, top1: 0.60064, throughput: 314.94 | 2022-04-03 09:30:12.300 [rank:1] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.58128, throughput: 499.93 | 2022-04-03 09:30:24.794 [rank:0] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.59232, throughput: 500.22 | 2022-04-03 09:30:24.795 [rank:2] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.56864, throughput: 499.47 | 2022-04-03 09:30:24.796 [rank:7] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.57984, throughput: 499.29 | 2022-04-03 09:30:24.814 [rank:6] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.57424, throughput: 498.83 | 2022-04-03 09:30:24.820 [rank:4] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.57808, throughput: 498.09 | 2022-04-03 09:30:24.833 [rank:3] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.57328, throughput: 497.94 | 2022-04-03 09:30:24.834 [rank:5] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.56752, throughput: 496.48 | 2022-04-03 09:30:24.873 [rank:0] [train], epoch: 21/50, iter: 100/834, loss: 0.32732, lr: 0.953384, top1: 0.59620, throughput: 311.55 | 2022-04-03 09:31:26.422 [rank:3] [train], epoch: 21/50, iter: 100/834, loss: 0.32308, lr: 0.953384, top1: 0.60536, throughput: 311.67 | 2022-04-03 09:31:26.437 [rank:1] [train], epoch: 21/50, iter: 100/834, loss: 0.32534, lr: 0.953384, top1: 0.59979, throughput: 311.35 | 2022-04-03 09:31:26.461 [rank:4] [train], epoch: 21/50, iter: 100/834, loss: 0.32482, lr: 0.953384, top1: 0.60370, throughput: 311.47 | 2022-04-03 09:31:26.477 [rank:6] [train], epoch: 21/50, iter: 100/834, loss: 0.32695, lr: 0.953384, top1: 0.60083, throughput: 311.35 | 2022-04-03 09:31:26.487 [rank:5] [train], epoch: 21/50, iter: 100/834, loss: 0.32588, lr: 0.953384, top1: 0.59797, throughput: 311.57 | 2022-04-03 09:31:26.497 [rank:7] [train], epoch: 21/50, iter: 100/834, loss: 0.32000, lr: 0.953384, top1: 0.61635, throughput: 311.25 | 2022-04-03 09:31:26.501 [rank:2] [train], epoch: 21/50, iter: 100/834, loss: 0.32433, lr: 0.953384, top1: 0.60589, throughput: 311.14 | 2022-04-03 09:31:26.505 [rank:3] [train], epoch: 21/50, iter: 200/834, loss: 0.32893, lr: 0.947764, top1: 0.59641, throughput: 312.94 | 2022-04-03 09:32:27.790 [rank:2] [train], epoch: 21/50, iter: 200/834, loss: 0.32612, lr: 0.947764, top1: 0.60240, throughput: 313.04 | 2022-04-03 09:32:27.840 [rank:1] [train], epoch: 21/50, iter: 200/834, loss: 0.32761, lr: 0.947764, top1: 0.59635, throughput: 312.78 | 2022-04-03 09:32:27.847 [rank:5] [train], epoch: 21/50, iter: 200/834, loss: 0.32442, lr: 0.947764, top1: 0.60286, throughput: 312.77 | 2022-04-03 09:32:27.884 [rank:6] [train], epoch: 21/50, iter: 200/834, loss: 0.32811, lr: 0.947764, top1: 0.59844, throughput: 312.72 | 2022-04-03 09:32:27.884 [rank:7] [train], epoch: 21/50, iter: 200/834, loss: 0.32744, lr: 0.947764, top1: 0.59953, throughput: 312.76 | 2022-04-03 09:32:27.889 [rank:0] [train], epoch: 21/50, iter: 200/834, loss: 0.32861, lr: 0.947764, top1: 0.59453, throughput: 312.31 | 2022-04-03 09:32:27.899 [rank:4] [train], epoch: 21/50, iter: 200/834, loss: 0.32693, lr: 0.947764, top1: 0.60104, throughput: 312.96 | 2022-04-03 09:32:27.827 [rank:1] [train], epoch: 21/50, iter: 300/834, loss: 0.32704, lr: 0.942134, top1: 0.59729, throughput: 313.74 | 2022-04-03 09:33:29.043 [rank:2] [train], epoch: 21/50, iter: 300/834, loss: 0.32372, lr: 0.942134, top1: 0.60448, throughput: 313.68 | 2022-04-03 09:33:29.049 [rank:5] [train], epoch: 21/50, iter: 300/834, loss: 0.32658, lr: 0.942134, top1: 0.60104, throughput: 313.88 | 2022-04-03 09:33:29.053 [rank:6] [train], epoch: 21/50, iter: 300/834, loss: 0.33034, lr: 0.942134, top1: 0.59401, throughput: 313.86 | 2022-04-03 09:33:29.058 [rank:7] [train], epoch: 21/50, iter: 300/834, loss: 0.32617, lr: 0.942134, top1: 0.60260, throughput: 313.87 | 2022-04-03 09:33:29.060 [rank:4] [train], epoch: 21/50, iter: 300/834, loss: 0.32749, lr: 0.942134, top1: 0.59927, throughput: 313.50 | 2022-04-03 09:33:29.070 [rank:0] [train], epoch: 21/50, iter: 300/834, loss: 0.32867, lr: 0.942134, top1: 0.60016, throughput: 313.87 | 2022-04-03 09:33:29.071 [rank:3] [train], epoch: 21/50, iter: 300/834, loss: 0.32624, lr: 0.942134, top1: 0.60208, throughput: 313.26 | 2022-04-03 09:33:29.080 [rank:1] [train], epoch: 21/50, iter: 400/834, loss: 0.32890, lr: 0.936494, top1: 0.59750, throughput: 313.91 | 2022-04-03 09:34:30.208 [rank:3] [train], epoch: 21/50, iter: 400/834, loss: 0.32881, lr: 0.936494, top1: 0.59490, throughput: 314.06 | 2022-04-03 09:34:30.215 [rank:7] [train], epoch: 21/50, iter: 400/834, loss: 0.32582, lr: 0.936494, top1: 0.59849, throughput: 313.82 | 2022-04-03 09:34:30.242 [rank:5] [train], epoch: 21/50, iter: 400/834, loss: 0.32991, lr: 0.936494, top1: 0.59745, throughput: 313.76 | 2022-04-03 09:34:30.245 [rank:6] [train], epoch: 21/50, iter: 400/834, loss: 0.32881, lr: 0.936494, top1: 0.59568, throughput: 313.78 | 2022-04-03 09:34:30.247 [rank:0] [train], epoch: 21/50, iter: 400/834, loss: 0.32754, lr: 0.936494, top1: 0.60083, throughput: 313.79 | 2022-04-03 09:34:30.260 [rank:4] [train], epoch: 21/50, iter: 400/834, loss: 0.32929, lr: 0.936494, top1: 0.59266, throughput: 313.71 | 2022-04-03 09:34:30.274 [rank:2] [train], epoch: 21/50, iter: 400/834, loss: 0.32993, lr: 0.936494, top1: 0.59021, throughput: 313.54 | 2022-04-03 09:34:30.285 [rank:5] [train], epoch: 21/50, iter: 500/834, loss: 0.32716, lr: 0.930844, top1: 0.59880, throughput: 313.15 | 2022-04-03 09:35:31.559 [rank:3] [train], epoch: 21/50, iter: 500/834, loss: 0.32585, lr: 0.930844, top1: 0.59552, throughput: 312.94 | 2022-04-03 09:35:31.568 [rank:2] [train], epoch: 21/50, iter: 500/834, loss: 0.32821, lr: 0.930844, top1: 0.59974, throughput: 313.15 | 2022-04-03 09:35:31.598 [rank:6] [train], epoch: 21/50, iter: 500/834, loss: 0.32861, lr: 0.930844, top1: 0.59656, throughput: 312.95 | 2022-04-03 09:35:31.599 [rank:1] [train], epoch: 21/50, iter: 500/834, loss: 0.32735, lr: 0.930844, top1: 0.60240, throughput: 312.62 | 2022-04-03 09:35:31.624 [rank:4] [train], epoch: 21/50, iter: 500/834, loss: 0.32676, lr: 0.930844, top1: 0.60047, throughput: 312.88 | 2022-04-03 09:35:31.640 [rank:0] [train], epoch: 21/50, iter: 500/834, loss: 0.32742, lr: 0.930844, top1: 0.59958, throughput: 312.80 | 2022-04-03 09:35:31.640 [rank:7] [train], epoch: 21/50, iter: 500/834, loss: 0.32837, lr: 0.930844, top1: 0.59682, throughput: 313.05 | 2022-04-03 09:35:31.574 [rank:1] [train], epoch: 21/50, iter: 600/834, loss: 0.32607, lr: 0.925185, top1: 0.60453, throughput: 312.62 | 2022-04-03 09:36:33.041 [rank:2] [train], epoch: 21/50, iter: 600/834, loss: 0.32699, lr: 0.925185, top1: 0.59854, throughput: 312.45 | 2022-04-03 09:36:33.048 [rank:4] [train], epoch: 21/50, iter: 600/834, loss: 0.33008, lr: 0.925185, top1: 0.59531, throughput: 312.63 | 2022-04-03 09:36:33.053 [rank:6] [train], epoch: 21/50, iter: 600/834, loss: 0.32694, lr: 0.925185, top1: 0.60177, throughput: 312.41 | 2022-04-03 09:36:33.057 [rank:7] [train], epoch: 21/50, iter: 600/834, loss: 0.33072, lr: 0.925185, top1: 0.59406, throughput: 312.14 | 2022-04-03 09:36:33.085 [rank:5] [train], epoch: 21/50, iter: 600/834, loss: 0.32671, lr: 0.925185, top1: 0.60266, throughput: 311.98 | 2022-04-03 09:36:33.100 [rank:3] [train], epoch: 21/50, iter: 600/834, loss: 0.32921, lr: 0.925185, top1: 0.59536, throughput: 312.03 | 2022-04-03 09:36:33.101 [rank:0] [train], epoch: 21/50, iter: 600/834, loss: 0.32978, lr: 0.925185, top1: 0.59427, throughput: 312.29 | 2022-04-03 09:36:33.121 [rank:7] [train], epoch: 21/50, iter: 700/834, loss: 0.32981, lr: 0.919517, top1: 0.59453, throughput: 313.72 | 2022-04-03 09:37:34.287 [rank:5] [train], epoch: 21/50, iter: 700/834, loss: 0.33027, lr: 0.919517, top1: 0.59583, throughput: 313.65 | 2022-04-03 09:37:34.316 [rank:1] [train], epoch: 21/50, iter: 700/834, loss: 0.33097, lr: 0.919517, top1: 0.59240, throughput: 313.34 | 2022-04-03 09:37:34.317 [rank:3] [train], epoch: 21/50, iter: 700/834, loss: 0.32946, lr: 0.919517, top1: 0.60068, throughput: 313.59 | 2022-04-03 09:37:34.328 [rank:6] [train], epoch: 21/50, iter: 700/834, loss: 0.32907, lr: 0.919517, top1: 0.59536, throughput: 313.33 | 2022-04-03 09:37:34.334 [rank:4] [train], epoch: 21/50, iter: 700/834, loss: 0.32531, lr: 0.919517, top1: 0.60406, throughput: 313.31 | 2022-04-03 09:37:34.334 [rank:0] [train], epoch: 21/50, iter: 700/834, loss: 0.33191, lr: 0.919517, top1: 0.58828, throughput: 313.60 | 2022-04-03 09:37:34.346 [rank:2] [train], epoch: 21/50, iter: 700/834, loss: 0.33123, lr: 0.919517, top1: 0.59401, throughput: 313.19 | 2022-04-03 09:37:34.353 [rank:3] [train], epoch: 21/50, iter: 800/834, loss: 0.32755, lr: 0.913841, top1: 0.59938, throughput: 313.29 | 2022-04-03 09:38:35.613 [rank:4] [train], epoch: 21/50, iter: 800/834, loss: 0.32842, lr: 0.913841, top1: 0.59609, throughput: 313.28 | 2022-04-03 09:38:35.621 [rank:1] [train], epoch: 21/50, iter: 800/834, loss: 0.32921, lr: 0.913841, top1: 0.59380, throughput: 312.90 | 2022-04-03 09:38:35.679 [rank:7] [train], epoch: 21/50, iter: 800/834, loss: 0.32810, lr: 0.913841, top1: 0.59687, throughput: 312.72 | 2022-04-03 09:38:35.684 [rank:2] [train], epoch: 21/50, iter: 800/834, loss: 0.32779, lr: 0.913841, top1: 0.59484, throughput: 313.05 | 2022-04-03 09:38:35.685 [rank:6] [train], epoch: 21/50, iter: 800/834, loss: 0.32598, lr: 0.913841, top1: 0.60167, throughput: 313.35 | 2022-04-03 09:38:35.606 [rank:0] [train], epoch: 21/50, iter: 800/834, loss: 0.32796, lr: 0.913841, top1: 0.59766, throughput: 313.22 | 2022-04-03 09:38:35.644 [rank:5] [train], epoch: 21/50, iter: 800/834, loss: 0.32734, lr: 0.913841, top1: 0.59505, throughput: 312.37 | 2022-04-03 09:38:35.781 [rank:0] [train], epoch: 21/50, iter: 834/834, loss: 0.33121, lr: 0.911909, top1: 0.59206, throughput: 312.13 | 2022-04-03 09:38:56.559 [rank:1] [train], epoch: 21/50, iter: 834/834, loss: 0.32845, lr: 0.911909, top1: 0.59773, throughput: 312.00 | 2022-04-03 09:38:56.602 [rank:2] [train], epoch: 21/50, iter: 834/834, loss: 0.32743, lr: 0.911909, top1: 0.59850, throughput: 311.77 | 2022-04-03 09:38:56.623 [rank:5] [train], epoch: 21/50, iter: 834/834, loss: 0.32705, lr: 0.911909, top1: 0.60110, throughput: 313.13 | 2022-04-03 09:38:56.629 [rank:4] [train], epoch: 21/50, iter: 834/834, loss: 0.32471, lr: 0.911909, top1: 0.61075, throughput: 310.64 | 2022-04-03 09:38:56.636 [rank:7] [train], epoch: 21/50, iter: 834/834, loss: 0.32980, lr: 0.911909, top1: 0.58808, throughput: 311.19 | 2022-04-03 09:38:56.662 [rank:6] [train], epoch: 21/50, iter: 834/834, loss: 0.32848, lr: 0.911909, top1: 0.58946, throughput: 310.02 | 2022-04-03 09:38:56.663 [rank:3] [train], epoch: 21/50, iter: 834/834, loss: 0.32489, lr: 0.911909, top1: 0.60800, throughput: 310.06 | 2022-04-03 09:38:56.666 [rank:2] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.58944, throughput: 488.37 | 2022-04-03 09:39:09.420 [rank:7] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.59376, throughput: 489.79 | 2022-04-03 09:39:09.423 [rank:0] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.59456, throughput: 485.81 | 2022-04-03 09:39:09.424 [rank:3] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.58336, throughput: 489.89 | 2022-04-03 09:39:09.424 [rank:5] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.58064, throughput: 488.38 | 2022-04-03 09:39:09.426 [rank:1] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.59216, throughput: 486.92 | 2022-04-03 09:39:09.437 [rank:6] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.59376, throughput: 489.10 | 2022-04-03 09:39:09.442 [rank:4] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.59120, throughput: 487.72 | 2022-04-03 09:39:09.450 [rank:3] [train], epoch: 22/50, iter: 100/834, loss: 0.31737, lr: 0.906221, top1: 0.61932, throughput: 312.99 | 2022-04-03 09:40:10.769 [rank:0] [train], epoch: 22/50, iter: 100/834, loss: 0.32403, lr: 0.906221, top1: 0.60005, throughput: 312.77 | 2022-04-03 09:40:10.810 [rank:1] [train], epoch: 22/50, iter: 100/834, loss: 0.31931, lr: 0.906221, top1: 0.61432, throughput: 312.80 | 2022-04-03 09:40:10.818 [rank:5] [train], epoch: 22/50, iter: 100/834, loss: 0.32651, lr: 0.906221, top1: 0.59833, throughput: 312.69 | 2022-04-03 09:40:10.829 [rank:4] [train], epoch: 22/50, iter: 100/834, loss: 0.32277, lr: 0.906221, top1: 0.60406, throughput: 312.75 | 2022-04-03 09:40:10.841 [rank:2] [train], epoch: 22/50, iter: 100/834, loss: 0.32238, lr: 0.906221, top1: 0.61203, throughput: 312.59 | 2022-04-03 09:40:10.843 [rank:7] [train], epoch: 22/50, iter: 100/834, loss: 0.32524, lr: 0.906221, top1: 0.60245, throughput: 312.58 | 2022-04-03 09:40:10.847 [rank:6] [train], epoch: 22/50, iter: 100/834, loss: 0.32467, lr: 0.906221, top1: 0.60344, throughput: 312.53 | 2022-04-03 09:40:10.875 [rank:5] [train], epoch: 22/50, iter: 200/834, loss: 0.32487, lr: 0.900526, top1: 0.59844, throughput: 312.32 | 2022-04-03 09:41:12.305 [rank:1] [train], epoch: 22/50, iter: 200/834, loss: 0.32445, lr: 0.900526, top1: 0.60599, throughput: 312.18 | 2022-04-03 09:41:12.322 [rank:7] [train], epoch: 22/50, iter: 200/834, loss: 0.32527, lr: 0.900526, top1: 0.60505, throughput: 312.31 | 2022-04-03 09:41:12.324 [rank:2] [train], epoch: 22/50, iter: 200/834, loss: 0.32201, lr: 0.900526, top1: 0.60469, throughput: 312.22 | 2022-04-03 09:41:12.339 [rank:4] [train], epoch: 22/50, iter: 200/834, loss: 0.32263, lr: 0.900526, top1: 0.60260, throughput: 311.97 | 2022-04-03 09:41:12.385 [rank:3] [train], epoch: 22/50, iter: 200/834, loss: 0.32237, lr: 0.900526, top1: 0.60531, throughput: 311.55 | 2022-04-03 09:41:12.395 [rank:6] [train], epoch: 22/50, iter: 200/834, loss: 0.32565, lr: 0.900526, top1: 0.60042, throughput: 311.96 | 2022-04-03 09:41:12.421 [rank:0] [train], epoch: 22/50, iter: 200/834, loss: 0.32111, lr: 0.900526, top1: 0.61349, throughput: 311.62 | 2022-04-03 09:41:12.423 [rank:2] [train], epoch: 22/50, iter: 300/834, loss: 0.32542, lr: 0.894823, top1: 0.60307, throughput: 312.33 | 2022-04-03 09:42:13.813 [rank:1] [train], epoch: 22/50, iter: 300/834, loss: 0.32533, lr: 0.894823, top1: 0.60187, throughput: 312.13 | 2022-04-03 09:42:13.834 [rank:3] [train], epoch: 22/50, iter: 300/834, loss: 0.32428, lr: 0.894823, top1: 0.60120, throughput: 312.46 | 2022-04-03 09:42:13.842 [rank:5] [train], epoch: 22/50, iter: 300/834, loss: 0.32555, lr: 0.894823, top1: 0.60490, throughput: 311.93 | 2022-04-03 09:42:13.858 [rank:7] [train], epoch: 22/50, iter: 300/834, loss: 0.32413, lr: 0.894823, top1: 0.60484, throughput: 312.02 | 2022-04-03 09:42:13.858 [rank:0] [train], epoch: 22/50, iter: 300/834, loss: 0.32839, lr: 0.894823, top1: 0.59599, throughput: 312.50 | 2022-04-03 09:42:13.863 [rank:4] [train], epoch: 22/50, iter: 300/834, loss: 0.32486, lr: 0.894823, top1: 0.60474, throughput: 312.28 | 2022-04-03 09:42:13.869 [rank:6] [train], epoch: 22/50, iter: 300/834, loss: 0.32633, lr: 0.894823, top1: 0.60016, throughput: 312.45 | 2022-04-03 09:42:13.872 [rank:3] [train], epoch: 22/50, iter: 400/834, loss: 0.32415, lr: 0.889113, top1: 0.60365, throughput: 313.47 | 2022-04-03 09:43:15.092 [rank:1] [train], epoch: 22/50, iter: 400/834, loss: 0.32734, lr: 0.889113, top1: 0.59865, throughput: 313.32 | 2022-04-03 09:43:15.112 [rank:4] [train], epoch: 22/50, iter: 400/834, loss: 0.32574, lr: 0.889113, top1: 0.60245, throughput: 313.43 | 2022-04-03 09:43:15.127 [rank:0] [train], epoch: 22/50, iter: 400/834, loss: 0.32574, lr: 0.889113, top1: 0.60594, throughput: 313.35 | 2022-04-03 09:43:15.136 [rank:6] [train], epoch: 22/50, iter: 400/834, loss: 0.32131, lr: 0.889113, top1: 0.60974, throughput: 313.36 | 2022-04-03 09:43:15.144 [rank:5] [train], epoch: 22/50, iter: 400/834, loss: 0.32339, lr: 0.889113, top1: 0.60792, throughput: 313.28 | 2022-04-03 09:43:15.145 [rank:2] [train], epoch: 22/50, iter: 400/834, loss: 0.32439, lr: 0.889113, top1: 0.60609, throughput: 312.96 | 2022-04-03 09:43:15.163 [rank:7] [train], epoch: 22/50, iter: 400/834, loss: 0.32367, lr: 0.889113, top1: 0.60781, throughput: 313.62 | 2022-04-03 09:43:15.078 [rank:6] [train], epoch: 22/50, iter: 500/834, loss: 0.32593, lr: 0.883396, top1: 0.60318, throughput: 314.57 | 2022-04-03 09:44:16.178 [rank:1] [train], epoch: 22/50, iter: 500/834, loss: 0.32630, lr: 0.883396, top1: 0.60052, throughput: 314.29 | 2022-04-03 09:44:16.203 [rank:3] [train], epoch: 22/50, iter: 500/834, loss: 0.32779, lr: 0.883396, top1: 0.59849, throughput: 314.16 | 2022-04-03 09:44:16.207 [rank:5] [train], epoch: 22/50, iter: 500/834, loss: 0.32553, lr: 0.883396, top1: 0.60057, throughput: 314.43 | 2022-04-03 09:44:16.208 [rank:4] [train], epoch: 22/50, iter: 500/834, loss: 0.32645, lr: 0.883396, top1: 0.60068, throughput: 314.29 | 2022-04-03 09:44:16.218 [rank:7] [train], epoch: 22/50, iter: 500/834, loss: 0.32583, lr: 0.883396, top1: 0.60422, throughput: 313.89 | 2022-04-03 09:44:16.246 [rank:0] [train], epoch: 22/50, iter: 500/834, loss: 0.32439, lr: 0.883396, top1: 0.60297, throughput: 314.59 | 2022-04-03 09:44:16.168 [rank:2] [train], epoch: 22/50, iter: 500/834, loss: 0.32613, lr: 0.883396, top1: 0.59849, throughput: 314.73 | 2022-04-03 09:44:16.168 [rank:1] [train], epoch: 22/50, iter: 600/834, loss: 0.32512, lr: 0.877673, top1: 0.60323, throughput: 312.19 | 2022-04-03 09:45:17.705 [rank:4] [train], epoch: 22/50, iter: 600/834, loss: 0.32255, lr: 0.877673, top1: 0.61047, throughput: 312.11 | 2022-04-03 09:45:17.734 [rank:0] [train], epoch: 22/50, iter: 600/834, loss: 0.32532, lr: 0.877673, top1: 0.60219, throughput: 311.77 | 2022-04-03 09:45:17.750 [rank:6] [train], epoch: 22/50, iter: 600/834, loss: 0.32587, lr: 0.877673, top1: 0.60219, throughput: 311.78 | 2022-04-03 09:45:17.761 [rank:2] [train], epoch: 22/50, iter: 600/834, loss: 0.32379, lr: 0.877673, top1: 0.60542, throughput: 311.71 | 2022-04-03 09:45:17.763 [rank:5] [train], epoch: 22/50, iter: 600/834, loss: 0.32413, lr: 0.877673, top1: 0.60802, throughput: 311.91 | 2022-04-03 09:45:17.764 [rank:7] [train], epoch: 22/50, iter: 600/834, loss: 0.32564, lr: 0.877673, top1: 0.60031, throughput: 311.99 | 2022-04-03 09:45:17.786 [rank:3] [train], epoch: 22/50, iter: 600/834, loss: 0.32435, lr: 0.877673, top1: 0.60391, throughput: 312.24 | 2022-04-03 09:45:17.697 [rank:5] [train], epoch: 22/50, iter: 700/834, loss: 0.32776, lr: 0.871943, top1: 0.59771, throughput: 311.90 | 2022-04-03 09:46:19.322 [rank:7] [train], epoch: 22/50, iter: 700/834, loss: 0.32798, lr: 0.871943, top1: 0.59359, throughput: 311.97 | 2022-04-03 09:46:19.330 [rank:3] [train], epoch: 22/50, iter: 700/834, loss: 0.32568, lr: 0.871943, top1: 0.60708, throughput: 311.49 | 2022-04-03 09:46:19.336 [rank:1] [train], epoch: 22/50, iter: 700/834, loss: 0.32545, lr: 0.871943, top1: 0.60359, throughput: 311.49 | 2022-04-03 09:46:19.344 [rank:2] [train], epoch: 22/50, iter: 700/834, loss: 0.32321, lr: 0.871943, top1: 0.61094, throughput: 311.73 | 2022-04-03 09:46:19.355 [rank:4] [train], epoch: 22/50, iter: 700/834, loss: 0.32448, lr: 0.871943, top1: 0.60542, throughput: 311.56 | 2022-04-03 09:46:19.360 [rank:0] [train], epoch: 22/50, iter: 700/834, loss: 0.32434, lr: 0.871943, top1: 0.60396, throughput: 311.64 | 2022-04-03 09:46:19.360 [rank:6] [train], epoch: 22/50, iter: 700/834, loss: 0.32809, lr: 0.871943, top1: 0.59875, throughput: 311.55 | 2022-04-03 09:46:19.389 [rank:6] [train], epoch: 22/50, iter: 800/834, loss: 0.32355, lr: 0.866207, top1: 0.60385, throughput: 313.97 | 2022-04-03 09:47:20.542 [rank:5] [train], epoch: 22/50, iter: 800/834, loss: 0.32801, lr: 0.866207, top1: 0.59891, throughput: 313.62 | 2022-04-03 09:47:20.543 [rank:3] [train], epoch: 22/50, iter: 800/834, loss: 0.32523, lr: 0.866207, top1: 0.60161, throughput: 313.62 | 2022-04-03 09:47:20.557 [rank:2] [train], epoch: 22/50, iter: 800/834, loss: 0.32565, lr: 0.866207, top1: 0.60172, throughput: 313.67 | 2022-04-03 09:47:20.566 [rank:0] [train], epoch: 22/50, iter: 800/834, loss: 0.32350, lr: 0.866207, top1: 0.60760, throughput: 313.58 | 2022-04-03 09:47:20.588 [rank:7] [train], epoch: 22/50, iter: 800/834, loss: 0.32783, lr: 0.866207, top1: 0.59500, throughput: 313.41 | 2022-04-03 09:47:20.592 [rank:1] [train], epoch: 22/50, iter: 800/834, loss: 0.32180, lr: 0.866207, top1: 0.60974, throughput: 313.33 | 2022-04-03 09:47:20.622 [rank:4] [train], epoch: 22/50, iter: 800/834, loss: 0.32366, lr: 0.866207, top1: 0.60365, throughput: 313.84 | 2022-04-03 09:47:20.537 [rank:5] [train], epoch: 22/50, iter: 834/834, loss: 0.32314, lr: 0.864256, top1: 0.60555, throughput: 310.72 | 2022-04-03 09:47:41.553 [rank:2] [train], epoch: 22/50, iter: 834/834, loss: 0.32623, lr: 0.864256, top1: 0.59896, throughput: 310.23 | 2022-04-03 09:47:41.609 [rank:3] [train], epoch: 22/50, iter: 834/834, loss: 0.32627, lr: 0.864256, top1: 0.60080, throughput: 310.02 | 2022-04-03 09:47:41.614 [rank:7] [train], epoch: 22/50, iter: 834/834, loss: 0.32283, lr: 0.864256, top1: 0.60064, throughput: 310.44 | 2022-04-03 09:47:41.620 [rank:4] [train], epoch: 22/50, iter: 834/834, loss: 0.32593, lr: 0.864256, top1: 0.60386, throughput: 309.60 | 2022-04-03 09:47:41.622 [rank:0] [train], epoch: 22/50, iter: 834/834, loss: 0.32349, lr: 0.864256, top1: 0.61137, throughput: 310.30 | 2022-04-03 09:47:41.626 [rank:1] [train], epoch: 22/50, iter: 834/834, loss: 0.32545, lr: 0.864256, top1: 0.60018, throughput: 310.65 | 2022-04-03 09:47:41.636 [rank:6] [train], epoch: 22/50, iter: 834/834, loss: 0.32781, lr: 0.864256, top1: 0.59819, throughput: 309.08 | 2022-04-03 09:47:41.662 [rank:0] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.58912, throughput: 487.48 | 2022-04-03 09:47:54.447 [rank:2] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.57792, throughput: 486.52 | 2022-04-03 09:47:54.455 [rank:3] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.57168, throughput: 486.40 | 2022-04-03 09:47:54.463 [rank:5] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.57296, throughput: 483.98 | 2022-04-03 09:47:54.467 [rank:7] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.58208, throughput: 486.48 | 2022-04-03 09:47:54.468 [rank:1] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.57984, throughput: 487.02 | 2022-04-03 09:47:54.469 [rank:6] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.58624, throughput: 487.76 | 2022-04-03 09:47:54.476 [rank:4] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.58400, throughput: 485.30 | 2022-04-03 09:47:54.501 [rank:5] [train], epoch: 23/50, iter: 100/834, loss: 0.32102, lr: 0.858513, top1: 0.61385, throughput: 313.10 | 2022-04-03 09:48:55.788 [rank:0] [train], epoch: 23/50, iter: 100/834, loss: 0.31739, lr: 0.858513, top1: 0.61391, throughput: 312.91 | 2022-04-03 09:48:55.806 [rank:2] [train], epoch: 23/50, iter: 100/834, loss: 0.31975, lr: 0.858513, top1: 0.61307, throughput: 312.84 | 2022-04-03 09:48:55.827 [rank:1] [train], epoch: 23/50, iter: 100/834, loss: 0.31510, lr: 0.858513, top1: 0.62313, throughput: 312.76[rank:7] [train], epoch: 23/50, iter: 100/834, loss: 0.31795, lr: 0.858513, top1: 0.61667, throughput: 312.75 | 2022-04-03 09:48:55.859| 2022-04-03 09:48:55.859 [rank:3] [train], epoch: 23/50, iter: 100/834, loss: 0.31853, lr: 0.858513, top1: 0.61974, throughput: 312.69 | 2022-04-03 09:48:55.866 [rank:6] [train], epoch: 23/50, iter: 100/834, loss: 0.32147, lr: 0.858513, top1: 0.60422, throughput: 312.66 | 2022-04-03 09:48:55.885 [rank:4] [train], epoch: 23/50, iter: 100/834, loss: 0.32247, lr: 0.858513, top1: 0.60870, throughput: 312.78 | 2022-04-03 09:48:55.886 [rank:2] [train], epoch: 23/50, iter: 200/834, loss: 0.32107, lr: 0.852765, top1: 0.60911, throughput: 312.02 | 2022-04-03 09:49:57.362 [rank:5] [train], epoch: 23/50, iter: 200/834, loss: 0.32517, lr: 0.852765, top1: 0.60307, throughput: 311.75 | 2022-04-03 09:49:57.377 [rank:7] [train], epoch: 23/50, iter: 200/834, loss: 0.32099, lr: 0.852765, top1: 0.60849, throughput: 312.00 | 2022-04-03 09:49:57.396 [rank:1] [train], epoch: 23/50, iter: 200/834, loss: 0.31975, lr: 0.852765, top1: 0.60906, throughput: 311.94 | 2022-04-03 09:49:57.409 [rank:6] [train], epoch: 23/50, iter: 200/834, loss: 0.32056, lr: 0.852765, top1: 0.61318, throughput: 311.97 | 2022-04-03 09:49:57.429 [rank:4] [train], epoch: 23/50, iter: 200/834, loss: 0.32080, lr: 0.852765, top1: 0.60844, throughput: 311.94 | 2022-04-03 09:49:57.436 [rank:0] [train], epoch: 23/50, iter: 200/834, loss: 0.31960, lr: 0.852765, top1: 0.61380, throughput: 311.50 | 2022-04-03 09:49:57.444 [rank:3] [train], epoch: 23/50, iter: 200/834, loss: 0.31775, lr: 0.852765, top1: 0.61839, throughput: 311.80 | 2022-04-03 09:49:57.444 [rank:2] [train], epoch: 23/50, iter: 300/834, loss: 0.32136, lr: 0.847012, top1: 0.60984, throughput: 312.01 | 2022-04-03 09:50:58.898 [rank:4] [train], epoch: 23/50, iter: 300/834, loss: 0.31998, lr: 0.847012, top1: 0.61000, throughput: 312.22 | 2022-04-03 09:50:58.931 [rank:6] [train], epoch: 23/50, iter: 300/834, loss: 0.32082, lr: 0.847012, top1: 0.60839, throughput: 312.12 | 2022-04-03 09:50:58.944 [rank:5] [train], epoch: 23/50, iter: 300/834, loss: 0.32090, lr: 0.847012, top1: 0.61094, throughput: 311.85 | 2022-04-03 09:50:58.946 [rank:1] [train], epoch: 23/50, iter: 300/834, loss: 0.32189, lr: 0.847012, top1: 0.60661, throughput: 311.90 | 2022-04-03 09:50:58.968 [rank:0] [train], epoch: 23/50, iter: 300/834, loss: 0.31784, lr: 0.847012, top1: 0.61307, throughput: 312.06 | 2022-04-03 09:50:58.971 [rank:3] [train], epoch: 23/50, iter: 300/834, loss: 0.32049, lr: 0.847012, top1: 0.61271, throughput: 312.01 | 2022-04-03 09:50:58.980 [rank:7] [train], epoch: 23/50, iter: 300/834, loss: 0.32098, lr: 0.847012, top1: 0.60891, throughput: 311.63 | 2022-04-03 09:50:59.007 [rank:5] [train], epoch: 23/50, iter: 400/834, loss: 0.32036, lr: 0.841254, top1: 0.61141, throughput: 313.50 | 2022-04-03 09:52:00.189 [rank:6] [train], epoch: 23/50, iter: 400/834, loss: 0.32236, lr: 0.841254, top1: 0.60609, throughput: 313.35 | 2022-04-03 09:52:00.218 [rank:3] [train], epoch: 23/50, iter: 400/834, loss: 0.32064, lr: 0.841254, top1: 0.61328, throughput: 313.53 | 2022-04-03 09:52:00.218 [rank:7] [train], epoch: 23/50, iter: 400/834, loss: 0.32150, lr: 0.841254, top1: 0.60667, throughput: 313.62 | 2022-04-03 09:52:00.228 [rank:1] [train], epoch: 23/50, iter: 400/834, loss: 0.32267, lr: 0.841254, top1: 0.60964, throughput: 313.39 | 2022-04-03 09:52:00.233 [rank:4] [train], epoch: 23/50, iter: 400/834, loss: 0.32477, lr: 0.841254, top1: 0.60599, throughput: 313.17 | 2022-04-03 09:52:00.239 [rank:2] [train], epoch: 23/50, iter: 400/834, loss: 0.32176, lr: 0.841254, top1: 0.60661, throughput: 312.88 | 2022-04-03 09:52:00.263 [rank:0] [train], epoch: 23/50, iter: 400/834, loss: 0.32069, lr: 0.841254, top1: 0.61276, throughput: 313.21 | 2022-04-03 09:52:00.271 [rank:2] [train], epoch: 23/50, iter: 500/834, loss: 0.32536, lr: 0.835493, top1: 0.59854, throughput: 313.66 | 2022-04-03 09:53:01.477 [rank:5] [train], epoch: 23/50, iter: 500/834, loss: 0.32095, lr: 0.835493, top1: 0.61234, throughput: 313.27 | 2022-04-03 09:53:01.479 [rank:4] [train], epoch: 23/50, iter: 500/834, loss: 0.32358, lr: 0.835493, top1: 0.60370, throughput: 313.35 | 2022-04-03 09:53:01.513 [rank:0] [train], epoch: 23/50, iter: 500/834, loss: 0.32374, lr: 0.835493, top1: 0.60432, throughput: 313.45 | 2022-04-03 09:53:01.525 [rank:1] [train], epoch: 23/50, iter: 500/834, loss: 0.32510, lr: 0.835493, top1: 0.60646, throughput: 313.25 | 2022-04-03 09:53:01.526 [rank:6] [train], epoch: 23/50, iter: 500/834, loss: 0.32215, lr: 0.835493, top1: 0.60797, throughput: 313.17 | 2022-04-03 09:53:01.526 [rank:7] [train], epoch: 23/50, iter: 500/834, loss: 0.32216, lr: 0.835493, top1: 0.60875, throughput: 313.20 | 2022-04-03 09:53:01.530 [rank:3] [train], epoch: 23/50, iter: 500/834, loss: 0.32034, lr: 0.835493, top1: 0.61036, throughput: 313.14 | 2022-04-03 09:53:01.533 [rank:1] [train], epoch: 23/50, iter: 600/834, loss: 0.32094, lr: 0.829727, top1: 0.60995, throughput: 313.61 | 2022-04-03 09:54:02.748 [rank:2] [train], epoch: 23/50, iter: 600/834, loss: 0.32373, lr: 0.829727, top1: 0.60552, throughput: 313.25 | 2022-04-03 09:54:02.770 [rank:3] [train], epoch: 23/50, iter: 600/834, loss: 0.32452, lr: 0.829727, top1: 0.60318, throughput: 313.51 | 2022-04-03 09:54:02.775 [rank:7] [train], epoch: 23/50, iter: 600/834, loss: 0.32124, lr: 0.829727, top1: 0.61135, throughput: 313.33 | 2022-04-03 09:54:02.808 [rank:0] [train], epoch: 23/50, iter: 600/834, loss: 0.31969, lr: 0.829727, top1: 0.61156, throughput: 313.24 | 2022-04-03 09:54:02.820 [rank:5] [train], epoch: 23/50, iter: 600/834, loss: 0.32030, lr: 0.829727, top1: 0.61151, throughput: 312.89 | 2022-04-03 09:54:02.842 [rank:4] [train], epoch: 23/50, iter: 600/834, loss: 0.32274, lr: 0.829727, top1: 0.60542, throughput: 313.06 | 2022-04-03 09:54:02.843 [rank:6] [train], epoch: 23/50, iter: 600/834, loss: 0.32271, lr: 0.829727, top1: 0.61437, throughput: 313.08 | 2022-04-03 09:54:02.853 [rank:4] [train], epoch: 23/50, iter: 700/834, loss: 0.31965, lr: 0.823958, top1: 0.61198, throughput: 313.37 | 2022-04-03 09:55:04.112 [rank:3] [train], epoch: 23/50, iter: 700/834, loss: 0.32306, lr: 0.823958, top1: 0.60641, throughput: 312.91 | 2022-04-03 09:55:04.136 [rank:1] [train], epoch: 23/50, iter: 700/834, loss: 0.32153, lr: 0.823958, top1: 0.61151, throughput: 312.74 | 2022-04-03 09:55:04.141 [rank:7] [train], epoch: 23/50, iter: 700/834, loss: 0.32236, lr: 0.823958, top1: 0.60823, throughput: 313.03 | 2022-04-03 09:55:04.143 [rank:6] [train], epoch: 23/50, iter: 700/834, loss: 0.32123, lr: 0.823958, top1: 0.61208, throughput: 313.16 | 2022-04-03 09:55:04.163 [rank:5] [train], epoch: 23/50, iter: 700/834, loss: 0.32263, lr: 0.823958, top1: 0.60667, throughput: 313.05 | 2022-04-03 09:55:04.173 [rank:2] [train], epoch: 23/50, iter: 700/834, loss: 0.32111, lr: 0.823958, top1: 0.60870, throughput: 312.68 | 2022-04-03 09:55:04.176 [rank:0] [train], epoch: 23/50, iter: 700/834, loss: 0.32101, lr: 0.823958, top1: 0.60937, throughput: 312.88 | 2022-04-03 09:55:04.185 [rank:1] [train], epoch: 23/50, iter: 800/834, loss: 0.32319, lr: 0.818186, top1: 0.60547, throughput: 311.96 | 2022-04-03 09:56:05.687 [rank:6] [train], epoch: 23/50, iter: 800/834, loss: 0.32537, lr: 0.818186, top1: 0.60234, throughput: 312.03 | 2022-04-03 09:56:05.697 [rank:3] [train], epoch: 23/50, iter: 800/834, loss: 0.32152, lr: 0.818186, top1: 0.60776, throughput: 311.88 | 2022-04-03 09:56:05.698 [rank:7] [train], epoch: 23/50, iter: 800/834, loss: 0.32451, lr: 0.818186, top1: 0.60385, throughput: 311.83 | 2022-04-03 09:56:05.715 [rank:2] [train], epoch: 23/50, iter: 800/834, loss: 0.32405, lr: 0.818186, top1: 0.60641, throughput: 311.94 | 2022-04-03 09:56:05.726 [rank:4] [train], epoch: 23/50, iter: 800/834, loss: 0.32255, lr: 0.818186, top1: 0.60359, throughput: 311.60 | 2022-04-03 09:56:05.730 [rank:0] [train], epoch: 23/50, iter: 800/834, loss: 0.32130, lr: 0.818186, top1: 0.61234, throughput: 311.79 | 2022-04-03 09:56:05.765 [rank:5] [train], epoch: 23/50, iter: 800/834, loss: 0.31864, lr: 0.818186, top1: 0.61568, throughput: 311.66 | 2022-04-03 09:56:05.778 [rank:7] [train], epoch: 23/50, iter: 834/834, loss: 0.32141, lr: 0.816223, top1: 0.60938, throughput: 311.44 | 2022-04-03 09:56:26.676 [rank:5] [train], epoch: 23/50, iter: 834/834, loss: 0.31803, lr: 0.816223, top1: 0.61229, throughput: 312.34 | 2022-04-03 09:56:26.678 [rank:1] [train], epoch: 23/50, iter: 834/834, loss: 0.31814, lr: 0.816223, top1: 0.61918, throughput: 310.99 | 2022-04-03 09:56:26.678 [rank:2] [train], epoch: 23/50, iter: 834/834, loss: 0.32144, lr: 0.816223, top1: 0.61489, throughput: 311.52 | 2022-04-03 09:56:26.681 [rank:0] [train], epoch: 23/50, iter: 834/834, loss: 0.32579, lr: 0.816223, top1: 0.60325, throughput: 312.04 | 2022-04-03 09:56:26.686 [rank:6] [train], epoch: 23/50, iter: 834/834, loss: 0.32220, lr: 0.816223, top1: 0.61091, throughput: 311.00 | 2022-04-03 09:56:26.687 [rank:4] [train], epoch: 23/50, iter: 834/834, loss: 0.31760, lr: 0.816223, top1: 0.62178, throughput: 311.49 | 2022-04-03 09:56:26.688 [rank:3] [train], epoch: 23/50, iter: 834/834, loss: 0.32406, lr: 0.816223, top1: 0.60738, throughput: 310.90 | 2022-04-03 09:56:26.695 [rank:0] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.63824, throughput: 491.77 | 2022-04-03 09:56:39.395 [rank:2] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.62880, throughput: 491.23 | 2022-04-03 09:56:39.404 [rank:1] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.63456, throughput: 490.73 | 2022-04-03 09:56:39.414 [rank:7] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.63888, throughput: 490.57 | 2022-04-03 09:56:39.416 [rank:3] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.62928, throughput: 491.30 | 2022-04-03 09:56:39.417 [rank:5] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.63152, throughput: 490.57 | 2022-04-03 09:56:39.418 [rank:6] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.63648, throughput: 490.36 | 2022-04-03 09:56:39.432 [rank:4] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.63376, throughput: 490.06 | 2022-04-03 09:56:39.441 [rank:1] [train], epoch: 24/50, iter: 100/834, loss: 0.31716, lr: 0.810447, top1: 0.61927, throughput: 312.39 | 2022-04-03 09:57:40.876 [rank:5] [train], epoch: 24/50, iter: 100/834, loss: 0.31928, lr: 0.810447, top1: 0.61083, throughput: 312.31 | 2022-04-03 09:57:40.897 [rank:3] [train], epoch: 24/50, iter: 100/834, loss: 0.31773, lr: 0.810447, top1: 0.61677, throughput: 312.27 | 2022-04-03 09:57:40.902 [rank:6] [train], epoch: 24/50, iter: 100/834, loss: 0.31502, lr: 0.810447, top1: 0.62609, throughput: 312.24 | 2022-04-03 09:57:40.924 [rank:2] [train], epoch: 24/50, iter: 100/834, loss: 0.31676, lr: 0.810447, top1: 0.61578, throughput: 312.07 | 2022-04-03 09:57:40.930 [rank:7] [train], epoch: 24/50, iter: 100/834, loss: 0.31665, lr: 0.810447, top1: 0.62047, throughput: 312.08 | 2022-04-03 09:57:40.939 [rank:4] [train], epoch: 24/50, iter: 100/834, loss: 0.31644, lr: 0.810447, top1: 0.61771, throughput: 312.16 | 2022-04-03 09:57:40.948 [rank:0] [train], epoch: 24/50, iter: 100/834, loss: 0.31612, lr: 0.810447, top1: 0.62016, throughput: 311.86 | 2022-04-03 09:57:40.960 [rank:2] [train], epoch: 24/50, iter: 200/834, loss: 0.31457, lr: 0.804669, top1: 0.62172, throughput: 310.80 | 2022-04-03 09:58:42.707 [rank:1] [train], epoch: 24/50, iter: 200/834, loss: 0.31516, lr: 0.804669, top1: 0.62156, throughput: 310.43 | 2022-04-03 09:58:42.725 [rank:6] [train], epoch: 24/50, iter: 200/834, loss: 0.31791, lr: 0.804669, top1: 0.61422, throughput: 310.57 | 2022-04-03 09:58:42.745 [rank:3] [train], epoch: 24/50, iter: 200/834, loss: 0.31700, lr: 0.804669, top1: 0.61318, throughput: 310.39 | 2022-04-03 09:58:42.759 [rank:4] [train], epoch: 24/50, iter: 200/834, loss: 0.31711, lr: 0.804669, top1: 0.61922, throughput: 310.63 | 2022-04-03 09:58:42.759 [rank:0] [train], epoch: 24/50, iter: 200/834, loss: 0.32059, lr: 0.804669, top1: 0.61203, throughput: 310.65 | 2022-04-03 09:58:42.765 [rank:7] [train], epoch: 24/50, iter: 200/834, loss: 0.31946, lr: 0.804669, top1: 0.61802, throughput: 310.55 | 2022-04-03 09:58:42.765 [rank:5] [train], epoch: 24/50, iter: 200/834, loss: 0.31902, lr: 0.804669, top1: 0.61547, throughput: 310.71 | 2022-04-03 09:58:42.690 [rank:3] [train], epoch: 24/50, iter: 300/834, loss: 0.31581, lr: 0.798889, top1: 0.61651, throughput: 313.25 | 2022-04-03 09:59:44.052 [rank:1] [train], epoch: 24/50, iter: 300/834, loss: 0.31580, lr: 0.798889, top1: 0.62380, throughput: 312.83 | 2022-04-03 09:59:44.101 [rank:6] [train], epoch: 24/50, iter: 300/834, loss: 0.31722, lr: 0.798889, top1: 0.61656, throughput: 312.91 | 2022-04-03 09:59:44.104 [rank:4] [train], epoch: 24/50, iter: 300/834, loss: 0.31956, lr: 0.798889, top1: 0.61781, throughput: 312.91 | 2022-04-03 09:59:44.120 [rank:5] [train], epoch: 24/50, iter: 300/834, loss: 0.31887, lr: 0.798889, top1: 0.61443, throughput: 312.54 | 2022-04-03 09:59:44.123 [rank:7] [train], epoch: 24/50, iter: 300/834, loss: 0.31855, lr: 0.798889, top1: 0.61609, throughput: 312.83 | 2022-04-03 09:59:44.141 [rank:0] [train], epoch: 24/50, iter: 300/834, loss: 0.31807, lr: 0.798889, top1: 0.61651, throughput: 312.79 | 2022-04-03 09:59:44.147 [rank:2] [train], epoch: 24/50, iter: 300/834, loss: 0.31849, lr: 0.798889, top1: 0.61776, throughput: 312.85 | 2022-04-03 09:59:44.079 [rank:7] [train], epoch: 24/50, iter: 400/834, loss: 0.31960, lr: 0.793107, top1: 0.61375, throughput: 312.68 | 2022-04-03 10:00:45.546 [rank:4] [train], epoch: 24/50, iter: 400/834, loss: 0.31909, lr: 0.793107, top1: 0.61604, throughput: 312.56 | 2022-04-03 10:00:45.548 [rank:2] [train], epoch: 24/50, iter: 400/834, loss: 0.31667, lr: 0.793107, top1: 0.61870, throughput: 312.34 | 2022-04-03 10:00:45.551 [rank:3] [train], epoch: 24/50, iter: 400/834, loss: 0.31855, lr: 0.793107, top1: 0.61578, throughput: 312.03 | 2022-04-03 10:00:45.584 [rank:1] [train], epoch: 24/50, iter: 400/834, loss: 0.32002, lr: 0.793107, top1: 0.61115, throughput: 312.27 | 2022-04-03 10:00:45.587 [rank:6] [train], epoch: 24/50, iter: 400/834, loss: 0.31942, lr: 0.793107, top1: 0.61557, throughput: 312.28 | 2022-04-03 10:00:45.588 [rank:5] [train], epoch: 24/50, iter: 400/834, loss: 0.31845, lr: 0.793107, top1: 0.61656, throughput: 312.34 | 2022-04-03 10:00:45.594 [rank:0] [train], epoch: 24/50, iter: 400/834, loss: 0.31736, lr: 0.793107, top1: 0.61703, throughput: 312.44 | 2022-04-03 10:00:45.598 [rank:5] [train], epoch: 24/50, iter: 500/834, loss: 0.31665, lr: 0.787323, top1: 0.61479, throughput: 313.49 | 2022-04-03 10:01:46.840 [rank:1] [train], epoch: 24/50, iter: 500/834, loss: 0.31626, lr: 0.787323, top1: 0.61672, throughput: 313.45 | 2022-04-03 10:01:46.841 [rank:7] [train], epoch: 24/50, iter: 500/834, loss: 0.31754, lr: 0.787323, top1: 0.61536, throughput: 313.20 | 2022-04-03 10:01:46.848 [rank:4] [train], epoch: 24/50, iter: 500/834, loss: 0.31774, lr: 0.787323, top1: 0.61589, throughput: 313.03 | 2022-04-03 10:01:46.883 [rank:6] [train], epoch: 24/50, iter: 500/834, loss: 0.31620, lr: 0.787323, top1: 0.61995, throughput: 313.17 | 2022-04-03 10:01:46.895 [rank:0] [train], epoch: 24/50, iter: 500/834, loss: 0.31798, lr: 0.787323, top1: 0.61620, throughput: 313.19 | 2022-04-03 10:01:46.903 [rank:3] [train], epoch: 24/50, iter: 500/834, loss: 0.31796, lr: 0.787323, top1: 0.61714, throughput: 313.08 | 2022-04-03 10:01:46.911 [rank:2] [train], epoch: 24/50, iter: 500/834, loss: 0.32218, lr: 0.787323, top1: 0.60953, throughput: 313.29 | 2022-04-03 10:01:46.837 [rank:5] [train], epoch: 24/50, iter: 600/834, loss: 0.32049, lr: 0.781538, top1: 0.60979, throughput: 312.41 | 2022-04-03 10:02:48.298 [rank:4] [train], epoch: 24/50, iter: 600/834, loss: 0.31851, lr: 0.781538, top1: 0.61187, throughput: 312.38 | 2022-04-03 10:02:48.347 [rank:1] [train], epoch: 24/50, iter: 600/834, loss: 0.32059, lr: 0.781538, top1: 0.61005, throughput: 312.13 | 2022-04-03 10:02:48.354 [rank:6] [train], epoch: 24/50, iter: 600/834, loss: 0.31918, lr: 0.781538, top1: 0.61177, throughput: 312.38 | 2022-04-03 10:02:48.360 [rank:2] [train], epoch: 24/50, iter: 600/834, loss: 0.32240, lr: 0.781538, top1: 0.60464, throughput: 312.04 | 2022-04-03 10:02:48.367 [rank:3] [train], epoch: 24/50, iter: 600/834, loss: 0.32072, lr: 0.781538, top1: 0.60870, throughput: 312.38 | 2022-04-03 10:02:48.375 [rank:0] [train], epoch: 24/50, iter: 600/834, loss: 0.32014, lr: 0.781538, top1: 0.60948, throughput: 312.32 | 2022-04-03 10:02:48.377 [rank:7] [train], epoch: 24/50, iter: 600/834, loss: 0.32061, lr: 0.781538, top1: 0.61073, throughput: 311.96 | 2022-04-03 10:02:48.394 [rank:2] [train], epoch: 24/50, iter: 700/834, loss: 0.31738, lr: 0.775753, top1: 0.62052, throughput: 313.64 | 2022-04-03 10:03:49.584 [rank:5] [train], epoch: 24/50, iter: 700/834, loss: 0.31904, lr: 0.775753, top1: 0.61422, throughput: 313.28 | 2022-04-03 10:03:49.585 [rank:7] [train], epoch: 24/50, iter: 700/834, loss: 0.31787, lr: 0.775753, top1: 0.61573, throughput: 313.70 | 2022-04-03 10:03:49.600 [rank:3] [train], epoch: 24/50, iter: 700/834, loss: 0.32042, lr: 0.775753, top1: 0.60823, throughput: 313.57 | 2022-04-03 10:03:49.606 [rank:4] [train], epoch: 24/50, iter: 700/834, loss: 0.31941, lr: 0.775753, top1: 0.61510, throughput: 313.40 | 2022-04-03 10:03:49.611 [rank:1] [train], epoch: 24/50, iter: 700/834, loss: 0.31762, lr: 0.775753, top1: 0.61604, throughput: 313.43 | 2022-04-03 10:03:49.611 [rank:6] [train], epoch: 24/50, iter: 700/834, loss: 0.31888, lr: 0.775753, top1: 0.61484, throughput: 313.80 | 2022-04-03 10:03:49.545 [rank:0] [train], epoch: 24/50, iter: 700/834, loss: 0.31847, lr: 0.775753, top1: 0.61708, throughput: 313.32 | 2022-04-03 10:03:49.657 [rank:1] [train], epoch: 24/50, iter: 800/834, loss: 0.31776, lr: 0.769967, top1: 0.61698, throughput: 313.13 | 2022-04-03 10:04:50.927 [rank:3] [train], epoch: 24/50, iter: 800/834, loss: 0.31918, lr: 0.769967, top1: 0.61479, throughput: 313.00 | 2022-04-03 10:04:50.947 [rank:0] [train], epoch: 24/50, iter: 800/834, loss: 0.32115, lr: 0.769967, top1: 0.61240, throughput: 313.25 | 2022-04-03 10:04:50.950 [rank:7] [train], epoch: 24/50, iter: 800/834, loss: 0.31938, lr: 0.769967, top1: 0.61438, throughput: 312.90 | 2022-04-03 10:04:50.962 [rank:5] [train], epoch: 24/50, iter: 800/834, loss: 0.31743, lr: 0.769967, top1: 0.61885, throughput: 312.81 | 2022-04-03 10:04:50.963 [rank:4] [train], epoch: 24/50, iter: 800/834, loss: 0.32106, lr: 0.769967, top1: 0.61219, throughput: 312.95 | 2022-04-03 10:04:50.963 [rank:6] [train], epoch: 24/50, iter: 800/834, loss: 0.32265, lr: 0.769967, top1: 0.60479, throughput: 312.46 | 2022-04-03 10:04:50.994 [rank:2] [train], epoch: 24/50, iter: 800/834, loss: 0.32052, lr: 0.769967, top1: 0.60786, throughput: 313.13 | 2022-04-03 10:04:50.901 [rank:2] [train], epoch: 24/50, iter: 834/834, loss: 0.32047, lr: 0.768000, top1: 0.61627, throughput: 313.74 | 2022-04-03 10:05:11.708 [rank:7] [train], epoch: 24/50, iter: 834/834, loss: 0.31638, lr: 0.768000, top1: 0.61719, throughput: 314.49 | 2022-04-03 10:05:11.720 [rank:4] [train], epoch: 24/50, iter: 834/834, loss: 0.32004, lr: 0.768000, top1: 0.61091, throughput: 314.48 | 2022-04-03 10:05:11.721 [rank:6] [train], epoch: 24/50, iter: 834/834, loss: 0.31906, lr: 0.768000, top1: 0.61336, throughput: 314.94 | 2022-04-03 10:05:11.722 [rank:1] [train], epoch: 24/50, iter: 834/834, loss: 0.32075, lr: 0.768000, top1: 0.61489, throughput: 313.91 | 2022-04-03 10:05:11.723 [rank:0] [train], epoch: 24/50, iter: 834/834, loss: 0.32118, lr: 0.768000, top1: 0.61060, throughput: 314.26 | 2022-04-03 10:05:11.722 [rank:3] [train], epoch: 24/50, iter: 834/834, loss: 0.31798, lr: 0.768000, top1: 0.61428, throughput: 314.17 | 2022-04-03 10:05:11.726 [rank:5] [train], epoch: 24/50, iter: 834/834, loss: 0.31704, lr: 0.768000, top1: 0.61657, throughput: 314.32 | 2022-04-03 10:05:11.732 [rank:0] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.63392, throughput: 488.24 | 2022-04-03 10:05:24.523 [rank:2] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.62064, throughput: 487.23 | 2022-04-03 10:05:24.536 [rank:1] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.62352, throughput: 487.51 | 2022-04-03 10:05:24.543 [rank:7] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.62528, throughput: 487.37 | 2022-04-03 10:05:24.544 [rank:3] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.60896, throughput: 487.54 | 2022-04-03 10:05:24.546 [rank:5] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.61696, throughput: 486.91[rank:6] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.62112, throughput: 486.50 | 2022-04-03 10:05:24.568| 2022-04-03 10:05:24.569 [rank:4] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.61536, throughput: 486.35 | 2022-04-03 10:05:24.571 [rank:1] [train], epoch: 25/50, iter: 100/834, loss: 0.31133, lr: 0.762214, top1: 0.63016, throughput: 313.25 | 2022-04-03 10:06:25.835 [rank:7] [train], epoch: 25/50, iter: 100/834, loss: 0.31139, lr: 0.762214, top1: 0.63005, throughput: 313.22 | 2022-04-03 10:06:25.844 [rank:6] [train], epoch: 25/50, iter: 100/834, loss: 0.31330, lr: 0.762214, top1: 0.62516, throughput: 313.27 | 2022-04-03 10:06:25.858 [rank:5] [train], epoch: 25/50, iter: 100/834, loss: 0.31144, lr: 0.762214, top1: 0.63177, throughput: 313.21 | 2022-04-03 10:06:25.870 [rank:4] [train], epoch: 25/50, iter: 100/834, loss: 0.31315, lr: 0.762214, top1: 0.62891, throughput: 313.22 | 2022-04-03 10:06:25.871 [rank:3] [train], epoch: 25/50, iter: 100/834, loss: 0.31328, lr: 0.762214, top1: 0.62693, throughput: 313.09 | 2022-04-03 10:06:25.871 [rank:0] [train], epoch: 25/50, iter: 100/834, loss: 0.31631, lr: 0.762214, top1: 0.61906, throughput: 312.94 | 2022-04-03 10:06:25.878 [rank:2] [train], epoch: 25/50, iter: 100/834, loss: 0.31331, lr: 0.762214, top1: 0.62589, throughput: 312.86 | 2022-04-03 10:06:25.905 [rank:4] [train], epoch: 25/50, iter: 200/834, loss: 0.31181, lr: 0.756429, top1: 0.62974, throughput: 310.98 | 2022-04-03 10:07:27.610 [rank:6] [train], epoch: 25/50, iter: 200/834, loss: 0.31301, lr: 0.756429, top1: 0.62953, throughput: 310.69 | 2022-04-03 10:07:27.655 [rank:5] [train], epoch: 25/50, iter: 200/834, loss: 0.31568, lr: 0.756429, top1: 0.62271, throughput: 310.74 | 2022-04-03 10:07:27.658 [rank:3] [train], epoch: 25/50, iter: 200/834, loss: 0.31298, lr: 0.756429, top1: 0.62620, throughput: 310.67 | 2022-04-03 10:07:27.673 [rank:1] [train], epoch: 25/50, iter: 200/834, loss: 0.31732, lr: 0.756429, top1: 0.61474, throughput: 310.37 | 2022-04-03 10:07:27.697 [rank:7] [train], epoch: 25/50, iter: 200/834, loss: 0.31403, lr: 0.756429, top1: 0.62542, throughput: 310.38 | 2022-04-03 10:07:27.704 [rank:0] [train], epoch: 25/50, iter: 200/834, loss: 0.31178, lr: 0.756429, top1: 0.62734, throughput: 310.44 | 2022-04-03 10:07:27.725 [rank:2] [train], epoch: 25/50, iter: 200/834, loss: 0.31261, lr: 0.756429, top1: 0.62422, throughput: 311.03 | 2022-04-03 10:07:27.635 [rank:7] [train], epoch: 25/50, iter: 300/834, loss: 0.31615, lr: 0.750644, top1: 0.62073, throughput: 313.12 | 2022-04-03 10:08:29.022 [rank:3] [train], epoch: 25/50, iter: 300/834, loss: 0.31136, lr: 0.750644, top1: 0.63000, throughput: 312.91 | 2022-04-03 10:08:29.032 [rank:0] [train], epoch: 25/50, iter: 300/834, loss: 0.31656, lr: 0.750644, top1: 0.62260, throughput: 313.15 | 2022-04-03 10:08:29.038 [rank:4] [train], epoch: 25/50, iter: 300/834, loss: 0.31597, lr: 0.750644, top1: 0.61969, throughput: 312.40 | 2022-04-03 10:08:29.070 [rank:1] [train], epoch: 25/50, iter: 300/834, loss: 0.31506, lr: 0.750644, top1: 0.62099, throughput: 312.81 | 2022-04-03 10:08:29.076 [rank:2] [train], epoch: 25/50, iter: 300/834, loss: 0.31547, lr: 0.750644, top1: 0.62026, throughput: 312.47 | 2022-04-03 10:08:29.082 [rank:6] [train], epoch: 25/50, iter: 300/834, loss: 0.31592, lr: 0.750644, top1: 0.61797, throughput: 312.94 | 2022-04-03 10:08:29.009 [rank:5] [train], epoch: 25/50, iter: 300/834, loss: 0.31603, lr: 0.750644, top1: 0.62052, throughput: 312.49 | 2022-04-03 10:08:29.100 [rank:2] [train], epoch: 25/50, iter: 400/834, loss: 0.31437, lr: 0.744860, top1: 0.62198, throughput: 310.44 | 2022-04-03 10:09:30.930 [rank:0] [train], epoch: 25/50, iter: 400/834, loss: 0.31662, lr: 0.744860, top1: 0.62167, throughput: 310.21 | 2022-04-03 10:09:30.931 [rank:6] [train], epoch: 25/50, iter: 400/834, loss: 0.31767, lr: 0.744860, top1: 0.61250, throughput: 309.95 | 2022-04-03 10:09:30.955 [rank:5] [train], epoch: 25/50, iter: 400/834, loss: 0.31663, lr: 0.744860, top1: 0.61760, throughput: 310.40 | 2022-04-03 10:09:30.956 [rank:3] [train], epoch: 25/50, iter: 400/834, loss: 0.31433, lr: 0.744860, top1: 0.62104, throughput: 310.02 | 2022-04-03 10:09:30.964 [rank:4] [train], epoch: 25/50, iter: 400/834, loss: 0.31621, lr: 0.744860, top1: 0.62177, throughput: 310.21 | 2022-04-03 10:09:30.965 [rank:7] [train], epoch: 25/50, iter: 400/834, loss: 0.31680, lr: 0.744860, top1: 0.61573, throughput: 309.88 | 2022-04-03 10:09:30.981 [rank:1] [train], epoch: 25/50, iter: 400/834, loss: 0.31638, lr: 0.744860, top1: 0.61797, throughput: 310.49 | 2022-04-03 10:09:30.914 [rank:5] [train], epoch: 25/50, iter: 500/834, loss: 0.31416, lr: 0.739077, top1: 0.62078, throughput: 312.87 | 2022-04-03 10:10:32.324 [rank:0] [train], epoch: 25/50, iter: 500/834, loss: 0.31623, lr: 0.739077, top1: 0.61849, throughput: 312.73 | 2022-04-03 10:10:32.325 [rank:7] [train], epoch: 25/50, iter: 500/834, loss: 0.31122, lr: 0.739077, top1: 0.62620, throughput: 312.78 | 2022-04-03 10:10:32.367 [rank:4] [train], epoch: 25/50, iter: 500/834, loss: 0.31661, lr: 0.739077, top1: 0.62219, throughput: 312.67 | 2022-04-03 10:10:32.372 [rank:6] [train], epoch: 25/50, iter: 500/834, loss: 0.31496, lr: 0.739077, top1: 0.62219, throughput: 312.60 | 2022-04-03 10:10:32.376 [rank:1] [train], epoch: 25/50, iter: 500/834, loss: 0.31509, lr: 0.739077, top1: 0.61667, throughput: 312.35 | 2022-04-03 10:10:32.385 [rank:3] [train], epoch: 25/50, iter: 500/834, loss: 0.31428, lr: 0.739077, top1: 0.62198, throughput: 312.58 | 2022-04-03 10:10:32.388 [rank:2] [train], epoch: 25/50, iter: 500/834, loss: 0.31667, lr: 0.739077, top1: 0.61984, throughput: 312.37 | 2022-04-03 10:10:32.395 [rank:1] [train], epoch: 25/50, iter: 600/834, loss: 0.31644, lr: 0.733296, top1: 0.61802, throughput: 314.43 | 2022-04-03 10:11:33.447 [rank:6] [train], epoch: 25/50, iter: 600/834, loss: 0.31568, lr: 0.733296, top1: 0.61635, throughput: 314.37 | 2022-04-03 10:11:33.452 [rank:7] [train], epoch: 25/50, iter: 600/834, loss: 0.31660, lr: 0.733296, top1: 0.61641, throughput: 314.30 | 2022-04-03 10:11:33.456 [rank:0] [train], epoch: 25/50, iter: 600/834, loss: 0.31563, lr: 0.733296, top1: 0.61953, throughput: 314.00 | 2022-04-03 10:11:33.472 [rank:3] [train], epoch: 25/50, iter: 600/834, loss: 0.31657, lr: 0.733296, top1: 0.61896, throughput: 314.13 | 2022-04-03 10:11:33.508 [rank:4] [train], epoch: 25/50, iter: 600/834, loss: 0.31788, lr: 0.733296, top1: 0.61521, throughput: 314.01 | 2022-04-03 10:11:33.516 [rank:2] [train], epoch: 25/50, iter: 600/834, loss: 0.31811, lr: 0.733296, top1: 0.61281, throughput: 314.07 | 2022-04-03 10:11:33.528 [rank:5] [train], epoch: 25/50, iter: 600/834, loss: 0.31271, lr: 0.733296, top1: 0.62255, throughput: 314.16 | 2022-04-03 10:11:33.438 [rank:1] [train], epoch: 25/50, iter: 700/834, loss: 0.31495, lr: 0.727517, top1: 0.62260, throughput: 313.90 | 2022-04-03 10:12:34.613 [rank:6] [train], epoch: 25/50, iter: 700/834, loss: 0.31560, lr: 0.727517, top1: 0.61760, throughput: 313.89 | 2022-04-03 10:12:34.619 [rank:0] [train], epoch: 25/50, iter: 700/834, loss: 0.31676, lr: 0.727517, top1: 0.61906, throughput: 313.89 | 2022-04-03 10:12:34.640 [rank:2] [train], epoch: 25/50, iter: 700/834, loss: 0.31723, lr: 0.727517, top1: 0.61615, throughput: 314.15 | 2022-04-03 10:12:34.644 [rank:5] [train], epoch: 25/50, iter: 700/834, loss: 0.31878, lr: 0.727517, top1: 0.61807, throughput: 313.60 | 2022-04-03 10:12:34.663 [rank:7] [train], epoch: 25/50, iter: 700/834, loss: 0.31500, lr: 0.727517, top1: 0.61953, throughput: 313.67 | 2022-04-03 10:12:34.667 [rank:4] [train], epoch: 25/50, iter: 700/834, loss: 0.31561, lr: 0.727517, top1: 0.62240, throughput: 313.94 | 2022-04-03 10:12:34.674 [rank:3] [train], epoch: 25/50, iter: 700/834, loss: 0.31629, lr: 0.727517, top1: 0.62000, throughput: 313.86 | 2022-04-03 10:12:34.682 [rank:3] [train], epoch: 25/50, iter: 800/834, loss: 0.31472, lr: 0.721740, top1: 0.62219, throughput: 313.35 | 2022-04-03 10:13:35.954 [rank:5] [train], epoch: 25/50, iter: 800/834, loss: 0.31740, lr: 0.721740, top1: 0.61688, throughput: 313.18 | 2022-04-03 10:13:35.969 [rank:7] [train], epoch: 25/50, iter: 800/834, loss: 0.31583, lr: 0.721740, top1: 0.62078, throughput: 313.19 | 2022-04-03 10:13:35.973 [rank:2] [train], epoch: 25/50, iter: 800/834, loss: 0.31516, lr: 0.721740, top1: 0.62411, throughput: 313.03 | 2022-04-03 10:13:35.979 [rank:1] [train], epoch: 25/50, iter: 800/834, loss: 0.31422, lr: 0.721740, top1: 0.62333, throughput: 312.87 | 2022-04-03 10:13:35.981 [rank:6] [train], epoch: 25/50, iter: 800/834, loss: 0.31332, lr: 0.721740, top1: 0.62391, throughput: 312.74 | 2022-04-03 10:13:36.012 [rank:0] [train], epoch: 25/50, iter: 800/834, loss: 0.31552, lr: 0.721740, top1: 0.61964, throughput: 312.84 | 2022-04-03 10:13:36.012 [rank:4] [train], epoch: 25/50, iter: 800/834, loss: 0.31858, lr: 0.721740, top1: 0.61641, throughput: 312.93 | 2022-04-03 10:13:36.031 [rank:5] [train], epoch: 25/50, iter: 834/834, loss: 0.31474, lr: 0.719777, top1: 0.62699, throughput: 309.35 | 2022-04-03 10:13:57.071 [rank:6] [train], epoch: 25/50, iter: 834/834, loss: 0.31915, lr: 0.719777, top1: 0.61336, throughput: 309.90 | 2022-04-03 10:13:57.077 [rank:0] [train], epoch: 25/50, iter: 834/834, loss: 0.30875, lr: 0.719777, top1: 0.63542, throughput: 309.86 | 2022-04-03 10:13:57.080 [rank:3] [train], epoch: 25/50, iter: 834/834, loss: 0.31746, lr: 0.719777, top1: 0.61290, throughput: 308.97 | 2022-04-03 10:13:57.082 [rank:2] [train], epoch: 25/50, iter: 834/834, loss: 0.31650, lr: 0.719777, top1: 0.61336, throughput: 309.25 | 2022-04-03 10:13:57.089 [rank:4] [train], epoch: 25/50, iter: 834/834, loss: 0.31989, lr: 0.719777, top1: 0.60922, throughput: 309.82 | 2022-04-03 10:13:57.101 [rank:1] [train], epoch: 25/50, iter: 834/834, loss: 0.31570, lr: 0.719777, top1: 0.62040, throughput: 309.08 | 2022-04-03 10:13:57.102 [rank:7] [train], epoch: 25/50, iter: 834/834, loss: 0.31944, lr: 0.719777, top1: 0.61443, throughput: 308.49 | 2022-04-03 10:13:57.134 [rank:1] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64704, throughput: 494.55 | 2022-04-03 10:14:09.739 [rank:0] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64864, throughput: 493.48 | 2022-04-03 10:14:09.745 [rank:2] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.63952, throughput: 493.60 | 2022-04-03 10:14:09.751 [rank:4] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64160, throughput: 493.70 | 2022-04-03 10:14:09.761 [rank:7] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64768, throughput: 494.91 | 2022-04-03 10:14:09.763 [rank:6] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64176, throughput: 492.65 | 2022-04-03 10:14:09.763 [rank:3] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.63968, throughput: 492.63 | 2022-04-03 10:14:09.769 [rank:5] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.63056, throughput: 491.50 | 2022-04-03 10:14:09.788 [rank:2] [train], epoch: 26/50, iter: 100/834, loss: 0.30932, lr: 0.714004, top1: 0.63182, throughput: 311.96 | 2022-04-03 10:15:11.298 [rank:5] [train], epoch: 26/50, iter: 100/834, loss: 0.30976, lr: 0.714004, top1: 0.63370, throughput: 312.06 | 2022-04-03 10:15:11.315 [rank:0] [train], epoch: 26/50, iter: 100/834, loss: 0.30893, lr: 0.714004, top1: 0.63422, throughput: 311.83 | 2022-04-03 10:15:11.317 [rank:4] [train], epoch: 26/50, iter: 100/834, loss: 0.30963, lr: 0.714004, top1: 0.63099, throughput: 311.83 | 2022-04-03 10:15:11.333 [rank:1] [train], epoch: 26/50, iter: 100/834, loss: 0.31083, lr: 0.714004, top1: 0.62766, throughput: 311.67 | 2022-04-03 10:15:11.342 [rank:3] [train], epoch: 26/50, iter: 100/834, loss: 0.31048, lr: 0.714004, top1: 0.63260, throughput: 311.81 | 2022-04-03 10:15:11.346 [rank:7] [train], epoch: 26/50, iter: 100/834, loss: 0.30971, lr: 0.714004, top1: 0.63172, throughput: 311.74 | 2022-04-03 10:15:11.353 [rank:6] [train], epoch: 26/50, iter: 100/834, loss: 0.31279, lr: 0.714004, top1: 0.62521, throughput: 311.69 | 2022-04-03 10:15:11.363 [rank:3] [train], epoch: 26/50, iter: 200/834, loss: 0.30917, lr: 0.708234, top1: 0.63214, throughput: 313.35 | 2022-04-03 10:16:12.620 [rank:2] [train], epoch: 26/50, iter: 200/834, loss: 0.31051, lr: 0.708234, top1: 0.63047, throughput: 313.00 | 2022-04-03 10:16:12.641 [rank:4] [train], epoch: 26/50, iter: 200/834, loss: 0.31340, lr: 0.708234, top1: 0.62505, throughput: 313.17 | 2022-04-03 10:16:12.641 [rank:7] [train], epoch: 26/50, iter: 200/834, loss: 0.31072, lr: 0.708234, top1: 0.62708, throughput: 313.24 | 2022-04-03 10:16:12.648 [rank:5] [train], epoch: 26/50, iter: 200/834, loss: 0.31247, lr: 0.708234, top1: 0.62245, throughput: 313.03 | 2022-04-03 10:16:12.651 [rank:6] [train], epoch: 26/50, iter: 200/834, loss: 0.31177, lr: 0.708234, top1: 0.62734, throughput: 313.19 | 2022-04-03 10:16:12.667 [rank:1] [train], epoch: 26/50, iter: 200/834, loss: 0.31391, lr: 0.708234, top1: 0.61844, throughput: 313.02 | 2022-04-03 10:16:12.681 [rank:0] [train], epoch: 26/50, iter: 200/834, loss: 0.31182, lr: 0.708234, top1: 0.63068, throughput: 312.76 | 2022-04-03 10:16:12.706 [rank:6] [train], epoch: 26/50, iter: 300/834, loss: 0.31180, lr: 0.702467, top1: 0.62844, throughput: 311.96 | 2022-04-03 10:17:14.213 [rank:1] [train], epoch: 26/50, iter: 300/834, loss: 0.31216, lr: 0.702467, top1: 0.62880, throughput: 312.01 | 2022-04-03 10:17:14.218 [rank:5] [train], epoch: 26/50, iter: 300/834, loss: 0.30962, lr: 0.702467, top1: 0.63089, throughput: 311.83 | 2022-04-03 10:17:14.223 [rank:3] [train], epoch: 26/50, iter: 300/834, loss: 0.31098, lr: 0.702467, top1: 0.62833, throughput: 311.59 | 2022-04-03 10:17:14.238 [rank:0] [train], epoch: 26/50, iter: 300/834, loss: 0.31512, lr: 0.702467, top1: 0.62505, throughput: 312.00 | 2022-04-03 10:17:14.245 [rank:4] [train], epoch: 26/50, iter: 300/834, loss: 0.31496, lr: 0.702467, top1: 0.62714, throughput: 311.67 | 2022-04-03 10:17:14.245 [rank:2] [train], epoch: 26/50, iter: 300/834, loss: 0.31257, lr: 0.702467, top1: 0.62620, throughput: 311.54 | 2022-04-03 10:17:14.269 [rank:7] [train], epoch: 26/50, iter: 300/834, loss: 0.31180, lr: 0.702467, top1: 0.62313, throughput: 311.43 | 2022-04-03 10:17:14.299 [rank:5] [train], epoch: 26/50, iter: 400/834, loss: 0.31392, lr: 0.696704, top1: 0.62021, throughput: 313.30 | 2022-04-03 10:18:15.507 [rank:4] [train], epoch: 26/50, iter: 400/834, loss: 0.31217, lr: 0.696704, top1: 0.62448, throughput: 313.32 | 2022-04-03 10:18:15.525 [rank:2] [train], epoch: 26/50, iter: 400/834, loss: 0.31291, lr: 0.696704, top1: 0.62349, throughput: 313.41 | 2022-04-03 10:18:15.532 [rank:0] [train], epoch: 26/50, iter: 400/834, loss: 0.31317, lr: 0.696704, top1: 0.62516, throughput: 313.20 | 2022-04-03 10:18:15.548 [rank:7] [train], epoch: 26/50, iter: 400/834, loss: 0.31551, lr: 0.696704, top1: 0.62141, throughput: 313.47 | 2022-04-03 10:18:15.549 [rank:1] [train], epoch: 26/50, iter: 400/834, loss: 0.31190, lr: 0.696704, top1: 0.62500, throughput: 313.02 | 2022-04-03 10:18:15.556 [rank:6] [train], epoch: 26/50, iter: 400/834, loss: 0.31137, lr: 0.696704, top1: 0.63073, throughput: 312.92 | 2022-04-03 10:18:15.570 [rank:3] [train], epoch: 26/50, iter: 400/834, loss: 0.31493, lr: 0.696704, top1: 0.61792, throughput: 312.99 | 2022-04-03 10:18:15.581 [rank:3] [train], epoch: 26/50, iter: 500/834, loss: 0.31299, lr: 0.690945, top1: 0.62615, throughput: 313.65 | 2022-04-03 10:19:16.797 [rank:6] [train], epoch: 26/50, iter: 500/834, loss: 0.31212, lr: 0.690945, top1: 0.62516, throughput: 313.53 | 2022-04-03 10:19:16.809 [rank:0] [train], epoch: 26/50, iter: 500/834, loss: 0.31138, lr: 0.690945, top1: 0.62849, throughput: 313.31 | 2022-04-03 10:19:16.829 [rank:1] [train], epoch: 26/50, iter: 500/834, loss: 0.31787, lr: 0.690945, top1: 0.61656, throughput: 313.28 | 2022-04-03 10:19:16.843 [rank:2] [train], epoch: 26/50, iter: 500/834, loss: 0.31009, lr: 0.690945, top1: 0.62849, throughput: 313.45 | 2022-04-03 10:19:16.786 [rank:5] [train], epoch: 26/50, iter: 500/834, loss: 0.31488, lr: 0.690945, top1: 0.62401, throughput: 312.86 | 2022-04-03 10:19:16.877 [rank:4] [train], epoch: 26/50, iter: 500/834, loss: 0.31401, lr: 0.690945, top1: 0.62391, throughput: 312.86 | 2022-04-03 10:19:16.894 [rank:7] [train], epoch: 26/50, iter: 500/834, loss: 0.31435, lr: 0.690945, top1: 0.62255, throughput: 313.48 | 2022-04-03 10:19:16.796 [rank:7] [train], epoch: 26/50, iter: 600/834, loss: 0.31433, lr: 0.685191, top1: 0.62167, throughput: 312.45 | 2022-04-03 10:20:18.245 [rank:2] [train], epoch: 26/50, iter: 600/834, loss: 0.31439, lr: 0.685191, top1: 0.62198, throughput: 312.34 | 2022-04-03 10:20:18.258 [rank:1] [train], epoch: 26/50, iter: 600/834, loss: 0.31365, lr: 0.685191, top1: 0.62573, throughput: 312.58 | 2022-04-03 10:20:18.266 [rank:3] [train], epoch: 26/50, iter: 600/834, loss: 0.30929, lr: 0.685191, top1: 0.63104, throughput: 312.26 | 2022-04-03 10:20:18.283 [rank:0] [train], epoch: 26/50, iter: 600/834, loss: 0.31509, lr: 0.685191, top1: 0.62104, throughput: 312.39 | 2022-04-03 10:20:18.291 [rank:6] [train], epoch: 26/50, iter: 600/834, loss: 0.31326, lr: 0.685191, top1: 0.62438, throughput: 312.15 | 2022-04-03 10:20:18.318 [rank:5] [train], epoch: 26/50, iter: 600/834, loss: 0.31159, lr: 0.685191, top1: 0.62677, throughput: 312.43 | 2022-04-03 10:20:18.330 [rank:4] [train], epoch: 26/50, iter: 600/834, loss: 0.30946, lr: 0.685191, top1: 0.63120, throughput: 312.43 | 2022-04-03 10:20:18.347 [rank:2] [train], epoch: 26/50, iter: 700/834, loss: 0.31108, lr: 0.679441, top1: 0.62776, throughput: 312.25 | 2022-04-03 10:21:19.747 [rank:3] [train], epoch: 26/50, iter: 700/834, loss: 0.31290, lr: 0.679441, top1: 0.62495, throughput: 312.35 | 2022-04-03 10:21:19.753 [rank:7] [train], epoch: 26/50, iter: 700/834, loss: 0.31193, lr: 0.679441, top1: 0.62547, throughput: 312.01 | 2022-04-03 10:21:19.781 [rank:0] [train], epoch: 26/50, iter: 700/834, loss: 0.31348, lr: 0.679441, top1: 0.61896, throughput: 312.21 | 2022-04-03 10:21:19.787 [rank:1] [train], epoch: 26/50, iter: 700/834, loss: 0.31369, lr: 0.679441, top1: 0.61776, throughput: 312.07 | 2022-04-03 10:21:19.791 [rank:6] [train], epoch: 26/50, iter: 700/834, loss: 0.31070, lr: 0.679441, top1: 0.63057, throughput: 312.29 | 2022-04-03 10:21:19.800 [rank:4] [train], epoch: 26/50, iter: 700/834, loss: 0.31246, lr: 0.679441, top1: 0.62521, throughput: 312.31 | 2022-04-03 10:21:19.824 [rank:5] [train], epoch: 26/50, iter: 700/834, loss: 0.31467, lr: 0.679441, top1: 0.62437, throughput: 312.22 | 2022-04-03 10:21:19.824 [rank:4] [train], epoch: 26/50, iter: 800/834, loss: 0.31087, lr: 0.673696, top1: 0.62849, throughput: 314.17 | 2022-04-03 10:22:20.938 [rank:7] [train], epoch: 26/50, iter: 800/834, loss: 0.31621, lr: 0.673696, top1: 0.62333, throughput: 313.92 | 2022-04-03 10:22:20.942 [rank:6] [train], epoch: 26/50, iter: 800/834, loss: 0.31486, lr: 0.673696, top1: 0.62073, throughput: 313.92 | 2022-04-03 10:22:20.962 [rank:3] [train], epoch: 26/50, iter: 800/834, loss: 0.31253, lr: 0.673696, top1: 0.62094, throughput: 313.61 | 2022-04-03 10:22:20.975 [rank:2] [train], epoch: 26/50, iter: 800/834, loss: 0.31460, lr: 0.673696, top1: 0.62172, throughput: 313.58 | 2022-04-03 10:22:20.976 [rank:0] [train], epoch: 26/50, iter: 800/834, loss: 0.31478, lr: 0.673696, top1: 0.62375, throughput: 313.69 | 2022-04-03 10:22:20.994 [rank:5] [train], epoch: 26/50, iter: 800/834, loss: 0.31188, lr: 0.673696, top1: 0.62688, throughput: 313.87 | 2022-04-03 10:22:20.995 [rank:1] [train], epoch: 26/50, iter: 800/834, loss: 0.31278, lr: 0.673696, top1: 0.62521, throughput: 314.09 | 2022-04-03 10:22:20.920 [rank:5] [train], epoch: 26/50, iter: 834/834, loss: 0.31358, lr: 0.671744, top1: 0.61903, throughput: 313.34 | 2022-04-03 10:22:41.829 [rank:3] [train], epoch: 26/50, iter: 834/834, loss: 0.31091, lr: 0.671744, top1: 0.62714, throughput: 313.03 | 2022-04-03 10:22:41.830 [rank:7] [train], epoch: 26/50, iter: 834/834, loss: 0.31063, lr: 0.671744, top1: 0.63358, throughput: 312.48 | 2022-04-03 10:22:41.833 [rank:2] [train], epoch: 26/50, iter: 834/834, loss: 0.30912, lr: 0.671744, top1: 0.63251, throughput: 312.98 | 2022-04-03 10:22:41.833 [rank:6] [train], epoch: 26/50, iter: 834/834, loss: 0.31715, lr: 0.671744, top1: 0.61366, throughput: 312.72 | 2022-04-03 10:22:41.836 [rank:4] [train], epoch: 26/50, iter: 834/834, loss: 0.31722, lr: 0.671744, top1: 0.61734, throughput: 312.34 | 2022-04-03 10:22:41.838 [rank:0] [train], epoch: 26/50, iter: 834/834, loss: 0.31541, lr: 0.671744, top1: 0.62102, throughput: 313.11 | 2022-04-03 10:22:41.843 [rank:1] [train], epoch: 26/50, iter: 834/834, loss: 0.30966, lr: 0.671744, top1: 0.63143, throughput: 311.47 | 2022-04-03 10:22:41.878 [rank:0] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.63280, throughput: 483.59 | 2022-04-03 10:22:54.767 [rank:1] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.63136, throughput: 484.74 | 2022-04-03 10:22:54.772 [rank:2] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62256, throughput: 482.95 | 2022-04-03 10:22:54.775 [rank:3] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62112, throughput: 482.50 | 2022-04-03 10:22:54.783 [rank:7] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.63424, throughput: 482.23 | 2022-04-03 10:22:54.794 [rank:6] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62848, throughput: 481.51 | 2022-04-03 10:22:54.817 [rank:4] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62720, throughput: 481.50 | 2022-04-03 10:22:54.818 [rank:5] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62048, throughput: 480.13 | 2022-04-03 10:22:54.846 [rank:3] [train], epoch: 27/50, iter: 100/834, loss: 0.30790, lr: 0.666007, top1: 0.63573, throughput: 312.77 | 2022-04-03 10:23:56.171 [rank:5] [train], epoch: 27/50, iter: 100/834, loss: 0.30747, lr: 0.666007, top1: 0.63437, throughput: 313.04 | 2022-04-03 10:23:56.180 [rank:6] [train], epoch: 27/50, iter: 100/834, loss: 0.30614, lr: 0.666007, top1: 0.63917, throughput: 312.81 | 2022-04-03 10:23:56.195 [rank:4] [train], epoch: 27/50, iter: 100/834, loss: 0.30771, lr: 0.666007, top1: 0.63854, throughput: 312.75 | 2022-04-03 10:23:56.209 [rank:1] [train], epoch: 27/50, iter: 100/834, loss: 0.30952, lr: 0.666007, top1: 0.62938, throughput: 312.51 | 2022-04-03 10:23:56.209 [rank:2] [train], epoch: 27/50, iter: 100/834, loss: 0.30727, lr: 0.666007, top1: 0.63693, throughput: 312.52 | 2022-04-03 10:23:56.211 [rank:0] [train], epoch: 27/50, iter: 100/834, loss: 0.31012, lr: 0.666007, top1: 0.63000, throughput: 312.42 | 2022-04-03 10:23:56.222 [rank:7] [train], epoch: 27/50, iter: 100/834, loss: 0.30567, lr: 0.666007, top1: 0.64104, throughput: 312.49 | 2022-04-03 10:23:56.237 [rank:5] [train], epoch: 27/50, iter: 200/834, loss: 0.30770, lr: 0.660275, top1: 0.63370, throughput: 312.65 | 2022-04-03 10:24:57.591 [rank:7] [train], epoch: 27/50, iter: 200/834, loss: 0.30688, lr: 0.660275, top1: 0.63635, throughput: 312.70 | 2022-04-03 10:24:57.638 [rank:4] [train], epoch: 27/50, iter: 200/834, loss: 0.30762, lr: 0.660275, top1: 0.63672, throughput: 312.55 | 2022-04-03 10:24:57.639 [rank:2] [train], epoch: 27/50, iter: 200/834, loss: 0.31054, lr: 0.660275, top1: 0.63073, throughput: 312.49 | 2022-04-03 10:24:57.652 [rank:3] [train], epoch: 27/50, iter: 200/834, loss: 0.30993, lr: 0.660275, top1: 0.63094, throughput: 312.29 | 2022-04-03 10:24:57.652 [rank:6] [train], epoch: 27/50, iter: 200/834, loss: 0.31039, lr: 0.660275, top1: 0.63005, throughput: 312.32 | 2022-04-03 10:24:57.671 [rank:0] [train], epoch: 27/50, iter: 200/834, loss: 0.30614, lr: 0.660275, top1: 0.64000, throughput: 312.41 | 2022-04-03 10:24:57.680 [rank:1] [train], epoch: 27/50, iter: 200/834, loss: 0.30569, lr: 0.660275, top1: 0.63375, throughput: 312.81 | 2022-04-03 10:24:57.587 [rank:6] [train], epoch: 27/50, iter: 300/834, loss: 0.30895, lr: 0.654549, top1: 0.62990, throughput: 311.53 | 2022-04-03 10:25:59.303 [rank:0] [train], epoch: 27/50, iter: 300/834, loss: 0.30849, lr: 0.654549, top1: 0.62901, throughput: 311.55 | 2022-04-03 10:25:59.307 [rank:1] [train], epoch: 27/50, iter: 300/834, loss: 0.30954, lr: 0.654549, top1: 0.63177, throughput: 310.91 | 2022-04-03 10:25:59.341 [rank:5] [train], epoch: 27/50, iter: 300/834, loss: 0.30814, lr: 0.654549, top1: 0.63510, throughput: 310.90 | 2022-04-03 10:25:59.348 [rank:4] [train], epoch: 27/50, iter: 300/834, loss: 0.30782, lr: 0.654549, top1: 0.63578, throughput: 311.10 | 2022-04-03 10:25:59.355 [rank:2] [train], epoch: 27/50, iter: 300/834, loss: 0.30859, lr: 0.654549, top1: 0.63323, throughput: 311.17 | 2022-04-03 10:25:59.355 [rank:7] [train], epoch: 27/50, iter: 300/834, loss: 0.30726, lr: 0.654549, top1: 0.63714, throughput: 310.97 | 2022-04-03 10:25:59.379 [rank:3] [train], epoch: 27/50, iter: 300/834, loss: 0.31146, lr: 0.654549, top1: 0.63286, throughput: 311.03 | 2022-04-03 10:25:59.382 [rank:6] [train], epoch: 27/50, iter: 400/834, loss: 0.30918, lr: 0.648830, top1: 0.62625, throughput: 311.74 | 2022-04-03 10:27:00.893 [rank:7] [train], epoch: 27/50, iter: 400/834, loss: 0.30655, lr: 0.648830, top1: 0.63208, throughput: 312.13 | 2022-04-03 10:27:00.893 [rank:4] [train], epoch: 27/50, iter: 400/834, loss: 0.30948, lr: 0.648830, top1: 0.62969, throughput: 311.95 | 2022-04-03 10:27:00.903 [rank:3] [train], epoch: 27/50, iter: 400/834, loss: 0.30941, lr: 0.648830, top1: 0.63130, throughput: 312.06 | 2022-04-03 10:27:00.909 [rank:1] [train], epoch: 27/50, iter: 400/834, loss: 0.30714, lr: 0.648830, top1: 0.63750, throughput: 311.83 | 2022-04-03 10:27:00.913 [rank:0] [train], epoch: 27/50, iter: 400/834, loss: 0.30910, lr: 0.648830, top1: 0.62823, throughput: 311.63 | 2022-04-03 10:27:00.918 [rank:5] [train], epoch: 27/50, iter: 400/834, loss: 0.30685, lr: 0.648830, top1: 0.63677, throughput: 311.83 | 2022-04-03 10:27:00.919 [rank:2] [train], epoch: 27/50, iter: 400/834, loss: 0.30907, lr: 0.648830, top1: 0.63438, throughput: 311.87 | 2022-04-03 10:27:00.919 [rank:1] [train], epoch: 27/50, iter: 500/834, loss: 0.30839, lr: 0.643117, top1: 0.63250, throughput: 314.53 | 2022-04-03 10:28:01.956 [rank:0] [train], epoch: 27/50, iter: 500/834, loss: 0.31152, lr: 0.643117, top1: 0.62620, throughput: 314.35 | 2022-04-03 10:28:01.997 [rank:6] [train], epoch: 27/50, iter: 500/834, loss: 0.30925, lr: 0.643117, top1: 0.63161, throughput: 314.19 | 2022-04-03 10:28:02.002 [rank:7] [train], epoch: 27/50, iter: 500/834, loss: 0.30782, lr: 0.643117, top1: 0.63615, throughput: 314.13 | 2022-04-03 10:28:02.015 [rank:2] [train], epoch: 27/50, iter: 500/834, loss: 0.31011, lr: 0.643117, top1: 0.62458, throughput: 314.23 | 2022-04-03 10:28:02.021 [rank:4] [train], epoch: 27/50, iter: 500/834, loss: 0.30884, lr: 0.643117, top1: 0.63401, throughput: 314.12 | 2022-04-03 10:28:02.027 [rank:5] [train], epoch: 27/50, iter: 500/834, loss: 0.30937, lr: 0.643117, top1: 0.63021, throughput: 314.18 | 2022-04-03 10:28:02.030 [rank:3] [train], epoch: 27/50, iter: 500/834, loss: 0.31109, lr: 0.643117, top1: 0.62677, throughput: 314.11 | 2022-04-03 10:28:02.033 [rank:6] [train], epoch: 27/50, iter: 600/834, loss: 0.30964, lr: 0.637412, top1: 0.62990, throughput: 312.64 | 2022-04-03 10:29:03.414 [rank:7] [train], epoch: 27/50, iter: 600/834, loss: 0.31210, lr: 0.637412, top1: 0.62453, throughput: 312.55 | 2022-04-03 10:29:03.446 [rank:0] [train], epoch: 27/50, iter: 600/834, loss: 0.31142, lr: 0.637412, top1: 0.62547, throughput: 312.45 | 2022-04-03 10:29:03.446 [rank:3] [train], epoch: 27/50, iter: 600/834, loss: 0.31050, lr: 0.637412, top1: 0.62792, throughput: 313.00 | 2022-04-03 10:29:03.374 [rank:1] [train], epoch: 27/50, iter: 600/834, loss: 0.31282, lr: 0.637412, top1: 0.62333, throughput: 312.15 | 2022-04-03 10:29:03.464 [rank:2] [train], epoch: 27/50, iter: 600/834, loss: 0.30737, lr: 0.637412, top1: 0.63500, throughput: 312.34 | 2022-04-03 10:29:03.493 [rank:5] [train], epoch: 27/50, iter: 600/834, loss: 0.31054, lr: 0.637412, top1: 0.63047, throughput: 312.29 | 2022-04-03 10:29:03.512 [rank:4] [train], epoch: 27/50, iter: 600/834, loss: 0.30915, lr: 0.637412, top1: 0.63365, throughput: 312.53 | 2022-04-03 10:29:03.460 [rank:5] [train], epoch: 27/50, iter: 700/834, loss: 0.30883, lr: 0.631714, top1: 0.63563, throughput: 311.43 | 2022-04-03 10:30:05.163 [rank:1] [train], epoch: 27/50, iter: 700/834, loss: 0.30769, lr: 0.631714, top1: 0.63484, throughput: 311.01 | 2022-04-03 10:30:05.199 [rank:7] [train], epoch: 27/50, iter: 700/834, loss: 0.30893, lr: 0.631714, top1: 0.63406, throughput: 310.88 | 2022-04-03 10:30:05.206 [rank:2] [train], epoch: 27/50, iter: 700/834, loss: 0.30700, lr: 0.631714, top1: 0.63896, throughput: 311.09 | 2022-04-03 10:30:05.211 [rank:0] [train], epoch: 27/50, iter: 700/834, loss: 0.31140, lr: 0.631714, top1: 0.62880, throughput: 310.84 | 2022-04-03 10:30:05.215 [rank:3] [train], epoch: 27/50, iter: 700/834, loss: 0.30746, lr: 0.631714, top1: 0.63771, throughput: 310.42 | 2022-04-03 10:30:05.225 [rank:4] [train], epoch: 27/50, iter: 700/834, loss: 0.31199, lr: 0.631714, top1: 0.62833, throughput: 310.75 | 2022-04-03 10:30:05.245 [rank:6] [train], epoch: 27/50, iter: 700/834, loss: 0.31341, lr: 0.631714, top1: 0.62141, throughput: 310.46 | 2022-04-03 10:30:05.257 [rank:6] [train], epoch: 27/50, iter: 800/834, loss: 0.30666, lr: 0.626024, top1: 0.63880, throughput: 312.55 | 2022-04-03 10:31:06.688 [rank:2] [train], epoch: 27/50, iter: 800/834, loss: 0.30987, lr: 0.626024, top1: 0.62630, throughput: 312.18 | 2022-04-03 10:31:06.714 [rank:7] [train], epoch: 27/50, iter: 800/834, loss: 0.30947, lr: 0.626024, top1: 0.63318, throughput: 312.13 | 2022-04-03 10:31:06.718 [rank:3] [train], epoch: 27/50, iter: 800/834, loss: 0.31163, lr: 0.626024, top1: 0.62719, throughput: 312.09 | 2022-04-03 10:31:06.746 [rank:4] [train], epoch: 27/50, iter: 800/834, loss: 0.31021, lr: 0.626024, top1: 0.63240, throughput: 312.18 | 2022-04-03 10:31:06.748 [rank:5] [train], epoch: 27/50, iter: 800/834, loss: 0.31113, lr: 0.626024, top1: 0.62880, throughput: 311.70 | 2022-04-03 10:31:06.761 [rank:0] [train], epoch: 27/50, iter: 800/834, loss: 0.31030, lr: 0.626024, top1: 0.63266, throughput: 311.93 | 2022-04-03 10:31:06.768 [rank:1] [train], epoch: 27/50, iter: 800/834, loss: 0.30870, lr: 0.626024, top1: 0.62885, throughput: 311.80 | 2022-04-03 10:31:06.776 [rank:5] [train], epoch: 27/50, iter: 834/834, loss: 0.30892, lr: 0.624091, top1: 0.63496, throughput: 315.03 | 2022-04-03 10:31:27.483 [rank:6] [train], epoch: 27/50, iter: 834/834, loss: 0.30971, lr: 0.624091, top1: 0.62531, throughput: 313.55 | 2022-04-03 10:31:27.507 [rank:1] [train], epoch: 27/50, iter: 834/834, loss: 0.30831, lr: 0.624091, top1: 0.63986, throughput: 314.83 | 2022-04-03 10:31:27.511 [rank:7] [train], epoch: 27/50, iter: 834/834, loss: 0.31522, lr: 0.624091, top1: 0.62362, throughput: 313.92 | 2022-04-03 10:31:27.513 [rank:4] [train], epoch: 27/50, iter: 834/834, loss: 0.30803, lr: 0.624091, top1: 0.63082, throughput: 314.32 | 2022-04-03 10:31:27.517 [rank:2] [train], epoch: 27/50, iter: 834/834, loss: 0.30812, lr: 0.624091, top1: 0.62975, throughput: 313.63 | 2022-04-03 10:31:27.529 [rank:3] [train], epoch: 27/50, iter: 834/834, loss: 0.31480, lr: 0.624091, top1: 0.62960, throughput: 313.86 | 2022-04-03 10:31:27.545 [rank:0] [train], epoch: 27/50, iter: 834/834, loss: 0.31017, lr: 0.624091, top1: 0.63542, throughput: 313.94 | 2022-04-03 10:31:27.561 [rank:1] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.65728, throughput: 480.54 | 2022-04-03 10:31:40.517 [rank:0] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.66288, throughput: 482.39 | 2022-04-03 10:31:40.518 [rank:2] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.66000, throughput: 480.81 | 2022-04-03 10:31:40.528 [rank:3] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.65296, throughput: 481.26 | 2022-04-03 10:31:40.532 [rank:5] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.64912, throughput: 478.68 | 2022-04-03 10:31:40.540 [rank:7] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.66592, throughput: 479.75 | 2022-04-03 10:31:40.540 [rank:4] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.65328, throughput: 478.82 | 2022-04-03 10:31:40.570 [rank:6] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.65760, throughput: 478.35 | 2022-04-03 10:31:40.573 [rank:1] [train], epoch: 28/50, iter: 100/834, loss: 0.30506, lr: 0.618412, top1: 0.64026, throughput: 313.21 | 2022-04-03 10:32:41.818 [rank:7] [train], epoch: 28/50, iter: 100/834, loss: 0.30508, lr: 0.618412, top1: 0.64177, throughput: 312.92 | 2022-04-03 10:32:41.898 [rank:4] [train], epoch: 28/50, iter: 100/834, loss: 0.30445, lr: 0.618412, top1: 0.64203, throughput: 313.03 | 2022-04-03 10:32:41.907 [rank:5] [train], epoch: 28/50, iter: 100/834, loss: 0.30052, lr: 0.618412, top1: 0.65021, throughput: 312.81 | 2022-04-03 10:32:41.918 [rank:0] [train], epoch: 28/50, iter: 100/834, loss: 0.30464, lr: 0.618412, top1: 0.63948, throughput: 312.69 | 2022-04-03 10:32:41.921 [rank:6] [train], epoch: 28/50, iter: 100/834, loss: 0.30404, lr: 0.618412, top1: 0.64031, throughput: 312.94 | 2022-04-03 10:32:41.926 [rank:3] [train], epoch: 28/50, iter: 100/834, loss: 0.29982, lr: 0.618412, top1: 0.65120, throughput: 312.70 | 2022-04-03 10:32:41.932 [rank:2] [train], epoch: 28/50, iter: 100/834, loss: 0.30537, lr: 0.618412, top1: 0.63682, throughput: 312.68 | 2022-04-03 10:32:41.932 [rank:0] [train], epoch: 28/50, iter: 200/834, loss: 0.30731, lr: 0.612741, top1: 0.63526, throughput: 311.37 | 2022-04-03 10:33:43.584 [rank:5] [train], epoch: 28/50, iter: 200/834, loss: 0.30278, lr: 0.612741, top1: 0.64604, throughput: 311.26 | 2022-04-03 10:33:43.603 [rank:2] [train], epoch: 28/50, iter: 200/834, loss: 0.30458, lr: 0.612741, top1: 0.63880, throughput: 311.33 | 2022-04-03 10:33:43.603 [rank:3] [train], epoch: 28/50, iter: 200/834, loss: 0.30486, lr: 0.612741, top1: 0.64318, throughput: 311.27 | 2022-04-03 10:33:43.615 [rank:1] [train], epoch: 28/50, iter: 200/834, loss: 0.30590, lr: 0.612741, top1: 0.63719, throughput: 310.69 | 2022-04-03 10:33:43.616 [rank:7] [train], epoch: 28/50, iter: 200/834, loss: 0.31011, lr: 0.612741, top1: 0.63141, throughput: 311.09 | 2022-04-03 10:33:43.616 [rank:4] [train], epoch: 28/50, iter: 200/834, loss: 0.30296, lr: 0.612741, top1: 0.64354, throughput: 311.11 | 2022-04-03 10:33:43.622 [rank:6] [train], epoch: 28/50, iter: 200/834, loss: 0.30661, lr: 0.612741, top1: 0.63880, throughput: 311.18 | 2022-04-03 10:33:43.627 [rank:5] [train], epoch: 28/50, iter: 300/834, loss: 0.30569, lr: 0.607079, top1: 0.63891, throughput: 312.79 | 2022-04-03 10:34:44.986 [rank:1] [train], epoch: 28/50, iter: 300/834, loss: 0.30746, lr: 0.607079, top1: 0.63615, throughput: 312.69 | 2022-04-03 10:34:45.018 [rank:3] [train], epoch: 28/50, iter: 300/834, loss: 0.30700, lr: 0.607079, top1: 0.63953, throughput: 312.64 | 2022-04-03 10:34:45.028 [rank:2] [train], epoch: 28/50, iter: 300/834, loss: 0.30440, lr: 0.607079, top1: 0.64260, throughput: 312.52 | 2022-04-03 10:34:45.040 [rank:0] [train], epoch: 28/50, iter: 300/834, loss: 0.30614, lr: 0.607079, top1: 0.63901, throughput: 312.40 | 2022-04-03 10:34:45.043 [rank:4] [train], epoch: 28/50, iter: 300/834, loss: 0.30592, lr: 0.607079, top1: 0.64021, throughput: 312.44 | 2022-04-03 10:34:45.074 [rank:7] [train], epoch: 28/50, iter: 300/834, loss: 0.30633, lr: 0.607079, top1: 0.63750, throughput: 312.79 | 2022-04-03 10:34:45.000 [rank:6] [train], epoch: 28/50, iter: 300/834, loss: 0.30325, lr: 0.607079, top1: 0.63922, throughput: 312.33 | 2022-04-03 10:34:45.101 [rank:5] [train], epoch: 28/50, iter: 400/834, loss: 0.30570, lr: 0.601426, top1: 0.63766, throughput: 313.84 | 2022-04-03 10:35:46.164 [rank:3] [train], epoch: 28/50, iter: 400/834, loss: 0.30360, lr: 0.601426, top1: 0.64380, throughput: 314.01 | 2022-04-03 10:35:46.173 [rank:0] [train], epoch: 28/50, iter: 400/834, loss: 0.30405, lr: 0.601426, top1: 0.64401, throughput: 314.06 | 2022-04-03 10:35:46.178 [rank:1] [train], epoch: 28/50, iter: 400/834, loss: 0.30800, lr: 0.601426, top1: 0.63646, throughput: 313.93 | 2022-04-03 10:35:46.178 [rank:6] [train], epoch: 28/50, iter: 400/834, loss: 0.30802, lr: 0.601426, top1: 0.63380, throughput: 314.34 | 2022-04-03 10:35:46.181 [rank:7] [train], epoch: 28/50, iter: 400/834, loss: 0.30802, lr: 0.601426, top1: 0.63563, throughput: 313.66 | 2022-04-03 10:35:46.213 [rank:2] [train], epoch: 28/50, iter: 400/834, loss: 0.30371, lr: 0.601426, top1: 0.64172, throughput: 313.81 | 2022-04-03 10:35:46.222 [rank:4] [train], epoch: 28/50, iter: 400/834, loss: 0.30841, lr: 0.601426, top1: 0.63563, throughput: 313.97 | 2022-04-03 10:35:46.227 [rank:7] [train], epoch: 28/50, iter: 500/834, loss: 0.30505, lr: 0.595783, top1: 0.64026, throughput: 312.43 | 2022-04-03 10:36:47.667 [rank:3] [train], epoch: 28/50, iter: 500/834, loss: 0.30619, lr: 0.595783, top1: 0.63615, throughput: 312.20 | 2022-04-03 10:36:47.673 [rank:6] [train], epoch: 28/50, iter: 500/834, loss: 0.30741, lr: 0.595783, top1: 0.63557, throughput: 312.15 | 2022-04-03 10:36:47.691 [rank:1] [train], epoch: 28/50, iter: 500/834, loss: 0.30543, lr: 0.595783, top1: 0.63750, throughput: 312.07 | 2022-04-03 10:36:47.702 [rank:5] [train], epoch: 28/50, iter: 500/834, loss: 0.30707, lr: 0.595783, top1: 0.63245, throughput: 311.97 | 2022-04-03 10:36:47.707 [rank:0] [train], epoch: 28/50, iter: 500/834, loss: 0.30400, lr: 0.595783, top1: 0.64281, throughput: 312.04 | 2022-04-03 10:36:47.709 [rank:4] [train], epoch: 28/50, iter: 500/834, loss: 0.30466, lr: 0.595783, top1: 0.64026, throughput: 312.27 | 2022-04-03 10:36:47.711 [rank:2] [train], epoch: 28/50, iter: 500/834, loss: 0.30535, lr: 0.595783, top1: 0.64474, throughput: 312.52 | 2022-04-03 10:36:47.658 [rank:2] [train], epoch: 28/50, iter: 600/834, loss: 0.30703, lr: 0.590149, top1: 0.63687, throughput: 313.11 | 2022-04-03 10:37:48.978 [rank:5] [train], epoch: 28/50, iter: 600/834, loss: 0.30707, lr: 0.590149, top1: 0.63865, throughput: 313.22 | 2022-04-03 10:37:49.006 [rank:3] [train], epoch: 28/50, iter: 600/834, loss: 0.30579, lr: 0.590149, top1: 0.63849, throughput: 313.05 | 2022-04-03 10:37:49.006 [rank:7] [train], epoch: 28/50, iter: 600/834, loss: 0.30536, lr: 0.590149, top1: 0.64193, throughput: 312.94 | 2022-04-03 10:37:49.020 [rank:4] [train], epoch: 28/50, iter: 600/834, loss: 0.30568, lr: 0.590149, top1: 0.63547, throughput: 313.15 | 2022-04-03 10:37:49.023 [rank:6] [train], epoch: 28/50, iter: 600/834, loss: 0.30928, lr: 0.590149, top1: 0.63719, throughput: 312.96 | 2022-04-03 10:37:49.041 [rank:0] [train], epoch: 28/50, iter: 600/834, loss: 0.30840, lr: 0.590149, top1: 0.63568, throughput: 313.02 | 2022-04-03 10:37:49.047 [rank:1] [train], epoch: 28/50, iter: 600/834, loss: 0.30725, lr: 0.590149, top1: 0.63120, throughput: 312.91 | 2022-04-03 10:37:49.062 [rank:7] [train], epoch: 28/50, iter: 700/834, loss: 0.30576, lr: 0.584525, top1: 0.63979, throughput: 311.85 | 2022-04-03 10:38:50.588 [rank:5] [train], epoch: 28/50, iter: 700/834, loss: 0.30497, lr: 0.584525, top1: 0.63906, throughput: 311.56 | 2022-04-03 10:38:50.631 [rank:6] [train], epoch: 28/50, iter: 700/834, loss: 0.30340, lr: 0.584525, top1: 0.64016, throughput: 311.64 | 2022-04-03 10:38:50.651 [rank:2] [train], epoch: 28/50, iter: 700/834, loss: 0.30684, lr: 0.584525, top1: 0.63516, throughput: 311.30 | 2022-04-03 10:38:50.655 [rank:0] [train], epoch: 28/50, iter: 700/834, loss: 0.30805, lr: 0.584525, top1: 0.63568, throughput: 311.64 | 2022-04-03 10:38:50.658 [rank:1] [train], epoch: 28/50, iter: 700/834, loss: 0.30825, lr: 0.584525, top1: 0.63719, throughput: 311.59 | 2022-04-03 10:38:50.681 [rank:3] [train], epoch: 28/50, iter: 700/834, loss: 0.30716, lr: 0.584525, top1: 0.63682, throughput: 311.29 | 2022-04-03 10:38:50.685 [rank:4] [train], epoch: 28/50, iter: 700/834, loss: 0.30551, lr: 0.584525, top1: 0.64089, throughput: 311.24 | 2022-04-03 10:38:50.711 [rank:3] [train], epoch: 28/50, iter: 800/834, loss: 0.30626, lr: 0.578912, top1: 0.63719, throughput: 313.87 | 2022-04-03 10:39:51.857 [rank:2] [train], epoch: 28/50, iter: 800/834, loss: 0.30988, lr: 0.578912, top1: 0.63167, throughput: 313.71 | 2022-04-03 10:39:51.859 [rank:7] [train], epoch: 28/50, iter: 800/834, loss: 0.31064, lr: 0.578912, top1: 0.63266, throughput: 313.23 | 2022-04-03 10:39:51.884 [rank:0] [train], epoch: 28/50, iter: 800/834, loss: 0.30493, lr: 0.578912, top1: 0.63802, throughput: 313.57 | 2022-04-03 10:39:51.887 [rank:4] [train], epoch: 28/50, iter: 800/834, loss: 0.30790, lr: 0.578912, top1: 0.63427, throughput: 313.82 | 2022-04-03 10:39:51.892 [rank:6] [train], epoch: 28/50, iter: 800/834, loss: 0.30715, lr: 0.578912, top1: 0.63552, throughput: 313.50 | 2022-04-03 10:39:51.895 [rank:1] [train], epoch: 28/50, iter: 800/834, loss: 0.30652, lr: 0.578912, top1: 0.63682, throughput: 313.64 | 2022-04-03 10:39:51.899 [rank:5] [train], epoch: 28/50, iter: 800/834, loss: 0.30831, lr: 0.578912, top1: 0.63510, throughput: 313.25 | 2022-04-03 10:39:51.924 [rank:1] [train], epoch: 28/50, iter: 834/834, loss: 0.30545, lr: 0.577006, top1: 0.63833, throughput: 312.77 | 2022-04-03 10:40:12.770 [rank:3] [train], epoch: 28/50, iter: 834/834, loss: 0.30751, lr: 0.577006, top1: 0.63986, throughput: 312.05 | 2022-04-03 10:40:12.777 [rank:4] [train], epoch: 28/50, iter: 834/834, loss: 0.30510, lr: 0.577006, top1: 0.63894, throughput: 312.45 | 2022-04-03 10:40:12.785 [rank:7] [train], epoch: 28/50, iter: 834/834, loss: 0.30798, lr: 0.577006, top1: 0.62868, throughput: 312.33 | 2022-04-03 10:40:12.786 [rank:0] [train], epoch: 28/50, iter: 834/834, loss: 0.30291, lr: 0.577006, top1: 0.64124, throughput: 312.12 | 2022-04-03 10:40:12.802 [rank:5] [train], epoch: 28/50, iter: 834/834, loss: 0.30062, lr: 0.577006, top1: 0.64844, throughput: 312.66 | 2022-04-03 10:40:12.803 [rank:2] [train], epoch: 28/50, iter: 834/834, loss: 0.30793, lr: 0.577006, top1: 0.63664, throughput: 311.66 | 2022-04-03 10:40:12.805 [rank:6] [train], epoch: 28/50, iter: 834/834, loss: 0.31153, lr: 0.577006, top1: 0.62362, throughput: 311.80 | 2022-04-03 10:40:12.832 [rank:0] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64720, throughput: 486.68 | 2022-04-03 10:40:25.644 [rank:1] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64512, throughput: 485.36 | 2022-04-03 10:40:25.647 [rank:2] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.63936, throughput: 486.42 | 2022-04-03 10:40:25.654 [rank:3] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64016, throughput: 485.26 | 2022-04-03 10:40:25.657 [rank:5] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.62512, throughput: 486.02 | 2022-04-03 10:40:25.662 [rank:7] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64464, throughput: 485.21 | 2022-04-03 10:40:25.667 [rank:6] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64416, throughput: 486.30 | 2022-04-03 10:40:25.684 [rank:4] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.63744, throughput: 484.25 | 2022-04-03 10:40:25.691 [rank:2] [train], epoch: 29/50, iter: 100/834, loss: 0.29794, lr: 0.571407, top1: 0.65182, throughput: 312.76 | 2022-04-03 10:41:27.043 [rank:1] [train], epoch: 29/50, iter: 100/834, loss: 0.30027, lr: 0.571407, top1: 0.65026, throughput: 312.58 | 2022-04-03 10:41:27.072 [rank:4] [train], epoch: 29/50, iter: 100/834, loss: 0.29997, lr: 0.571407, top1: 0.65177, throughput: 312.76 | 2022-04-03 10:41:27.080 [rank:3] [train], epoch: 29/50, iter: 100/834, loss: 0.29995, lr: 0.571407, top1: 0.65234, throughput: 312.53 | 2022-04-03 10:41:27.091 [rank:7] [train], epoch: 29/50, iter: 100/834, loss: 0.29765, lr: 0.571407, top1: 0.65656, throughput: 312.53 | 2022-04-03 10:41:27.101 [rank:0] [train], epoch: 29/50, iter: 100/834, loss: 0.30108, lr: 0.571407, top1: 0.65000, throughput: 312.40 | 2022-04-03 10:41:27.104 [rank:6] [train], epoch: 29/50, iter: 100/834, loss: 0.29972, lr: 0.571407, top1: 0.65125, throughput: 312.58 | 2022-04-03 10:41:27.108 [rank:5] [train], epoch: 29/50, iter: 100/834, loss: 0.29731, lr: 0.571407, top1: 0.65443, throughput: 312.45 | 2022-04-03 10:41:27.113 [rank:1] [train], epoch: 29/50, iter: 200/834, loss: 0.30124, lr: 0.565820, top1: 0.64698, throughput: 312.59 | 2022-04-03 10:42:28.494 [rank:3] [train], epoch: 29/50, iter: 200/834, loss: 0.30092, lr: 0.565820, top1: 0.64474, throughput: 312.64 | 2022-04-03 10:42:28.504 [rank:7] [train], epoch: 29/50, iter: 200/834, loss: 0.30059, lr: 0.565820, top1: 0.65339, throughput: 312.68 | 2022-04-03 10:42:28.505 [rank:5] [train], epoch: 29/50, iter: 200/834, loss: 0.30093, lr: 0.565820, top1: 0.64875, throughput: 312.65 | 2022-04-03 10:42:28.523 [rank:4] [train], epoch: 29/50, iter: 200/834, loss: 0.30151, lr: 0.565820, top1: 0.64500, throughput: 312.43 | 2022-04-03 10:42:28.533 [rank:6] [train], epoch: 29/50, iter: 200/834, loss: 0.29980, lr: 0.565820, top1: 0.65036, throughput: 312.57 | 2022-04-03 10:42:28.535 [rank:0] [train], epoch: 29/50, iter: 200/834, loss: 0.30093, lr: 0.565820, top1: 0.64911, throughput: 312.43 | 2022-04-03 10:42:28.557 [rank:2] [train], epoch: 29/50, iter: 200/834, loss: 0.30199, lr: 0.565820, top1: 0.64229, throughput: 312.47 | 2022-04-03 10:42:28.488 [rank:2] [train], epoch: 29/50, iter: 300/834, loss: 0.29922, lr: 0.560244, top1: 0.65073, throughput: 312.67 | 2022-04-03 10:43:29.894 [rank:5] [train], epoch: 29/50, iter: 300/834, loss: 0.30297, lr: 0.560244, top1: 0.64552, throughput: 312.75 | 2022-04-03 10:43:29.913 [rank:7] [train], epoch: 29/50, iter: 300/834, loss: 0.30348, lr: 0.560244, top1: 0.64646, throughput: 312.53 | 2022-04-03 10:43:29.940 [rank:3] [train], epoch: 29/50, iter: 300/834, loss: 0.30366, lr: 0.560244, top1: 0.64365, throughput: 312.49 | 2022-04-03 10:43:29.946 [rank:0] [train], epoch: 29/50, iter: 300/834, loss: 0.30112, lr: 0.560244, top1: 0.64583, throughput: 312.72 | 2022-04-03 10:43:29.953 [rank:4] [train], epoch: 29/50, iter: 300/834, loss: 0.30175, lr: 0.560244, top1: 0.64526, throughput: 312.57 | 2022-04-03 10:43:29.959 [rank:6] [train], epoch: 29/50, iter: 300/834, loss: 0.30309, lr: 0.560244, top1: 0.64417, throughput: 312.57 | 2022-04-03 10:43:29.961 [rank:1] [train], epoch: 29/50, iter: 300/834, loss: 0.30393, lr: 0.560244, top1: 0.64422, throughput: 312.31 | 2022-04-03 10:43:29.972 [rank:7] [train], epoch: 29/50, iter: 400/834, loss: 0.30223, lr: 0.554680, top1: 0.64505, throughput: 312.54 | 2022-04-03 10:44:31.372 [rank:6] [train], epoch: 29/50, iter: 400/834, loss: 0.30182, lr: 0.554680, top1: 0.64755, throughput: 312.59 | 2022-04-03 10:44:31.382 [rank:3] [train], epoch: 29/50, iter: 400/834, loss: 0.30191, lr: 0.554680, top1: 0.64589, throughput: 312.51 | 2022-04-03 10:44:31.383 [rank:0] [train], epoch: 29/50, iter: 400/834, loss: 0.30274, lr: 0.554680, top1: 0.64391, throughput: 312.53 | 2022-04-03 10:44:31.387 [rank:2] [train], epoch: 29/50, iter: 400/834, loss: 0.30501, lr: 0.554680, top1: 0.64161, throughput: 312.22 | 2022-04-03 10:44:31.390 [rank:1] [train], epoch: 29/50, iter: 400/834, loss: 0.30359, lr: 0.554680, top1: 0.64349, throughput: 312.86 | 2022-04-03 10:44:31.342 [rank:5] [train], epoch: 29/50, iter: 400/834, loss: 0.30493, lr: 0.554680, top1: 0.64062, throughput: 312.01 | 2022-04-03 10:44:31.450 [rank:4] [train], epoch: 29/50, iter: 400/834, loss: 0.30222, lr: 0.554680, top1: 0.64182, throughput: 312.19 | 2022-04-03 10:44:31.459 [rank:5] [train], epoch: 29/50, iter: 500/834, loss: 0.30351, lr: 0.549127, top1: 0.64208, throughput: 313.03 | 2022-04-03 10:45:32.787 [rank:1] [train], epoch: 29/50, iter: 500/834, loss: 0.29993, lr: 0.549127, top1: 0.64927, throughput: 312.46 | 2022-04-03 10:45:32.789 [rank:4] [train], epoch: 29/50, iter: 500/834, loss: 0.30366, lr: 0.549127, top1: 0.64344, throughput: 312.88 | 2022-04-03 10:45:32.824 [rank:3] [train], epoch: 29/50, iter: 500/834, loss: 0.30382, lr: 0.549127, top1: 0.64318, throughput: 312.47 | 2022-04-03 10:45:32.828 [rank:6] [train], epoch: 29/50, iter: 500/834, loss: 0.30337, lr: 0.549127, top1: 0.64109, throughput: 312.30 | 2022-04-03 10:45:32.862 [rank:7] [train], epoch: 29/50, iter: 500/834, loss: 0.30300, lr: 0.549127, top1: 0.64255, throughput: 312.23 | 2022-04-03 10:45:32.866 [rank:2] [train], epoch: 29/50, iter: 500/834, loss: 0.30249, lr: 0.549127, top1: 0.64385, throughput: 312.21 | 2022-04-03 10:45:32.887 [rank:0] [train], epoch: 29/50, iter: 500/834, loss: 0.30053, lr: 0.549127, top1: 0.65141, throughput: 312.62 | 2022-04-03 10:45:32.803 [rank:3] [train], epoch: 29/50, iter: 600/834, loss: 0.30311, lr: 0.543588, top1: 0.64630, throughput: 311.47 | 2022-04-03 10:46:34.471 [rank:7] [train], epoch: 29/50, iter: 600/834, loss: 0.30485, lr: 0.543588, top1: 0.63896, throughput: 311.58 | 2022-04-03 10:46:34.487 [rank:2] [train], epoch: 29/50, iter: 600/834, loss: 0.30415, lr: 0.543588, top1: 0.64214, throughput: 311.57 | 2022-04-03 10:46:34.511 [rank:0] [train], epoch: 29/50, iter: 600/834, loss: 0.30268, lr: 0.543588, top1: 0.64672, throughput: 311.07 | 2022-04-03 10:46:34.524 [rank:6] [train], epoch: 29/50, iter: 600/834, loss: 0.30580, lr: 0.543588, top1: 0.63875, throughput: 311.37 | 2022-04-03 10:46:34.525 [rank:4] [train], epoch: 29/50, iter: 600/834, loss: 0.30346, lr: 0.543588, top1: 0.63875, throughput: 311.11 | 2022-04-03 10:46:34.539 [rank:5] [train], epoch: 29/50, iter: 600/834, loss: 0.30474, lr: 0.543588, top1: 0.64339, throughput: 310.91 | 2022-04-03 10:46:34.540 [rank:1] [train], epoch: 29/50, iter: 600/834, loss: 0.30142, lr: 0.543588, top1: 0.64630, throughput: 310.85 | 2022-04-03 10:46:34.556 [rank:1] [train], epoch: 29/50, iter: 700/834, loss: 0.30276, lr: 0.538061, top1: 0.64302, throughput: 315.47 | 2022-04-03 10:47:35.417 [rank:5] [train], epoch: 29/50, iter: 700/834, loss: 0.30186, lr: 0.538061, top1: 0.64328, throughput: 315.29 | 2022-04-03 10:47:35.438 [rank:2] [train], epoch: 29/50, iter: 700/834, loss: 0.30307, lr: 0.538061, top1: 0.64604, throughput: 315.13 | 2022-04-03 10:47:35.439 [rank:3] [train], epoch: 29/50, iter: 700/834, loss: 0.30297, lr: 0.538061, top1: 0.64510, throughput: 314.86 | 2022-04-03 10:47:35.451 [rank:7] [train], epoch: 29/50, iter: 700/834, loss: 0.30236, lr: 0.538061, top1: 0.64396, throughput: 314.92 | 2022-04-03 10:47:35.455 [rank:4] [train], epoch: 29/50, iter: 700/834, loss: 0.30600, lr: 0.538061, top1: 0.63776, throughput: 315.07 | 2022-04-03 10:47:35.479 [rank:0] [train], epoch: 29/50, iter: 700/834, loss: 0.30415, lr: 0.538061, top1: 0.64229, throughput: 314.96 | 2022-04-03 10:47:35.485 [rank:6] [train], epoch: 29/50, iter: 700/834, loss: 0.30236, lr: 0.538061, top1: 0.64385, throughput: 314.81 | 2022-04-03 10:47:35.514 [rank:1] [train], epoch: 29/50, iter: 800/834, loss: 0.30232, lr: 0.532547, top1: 0.64495, throughput: 310.65 | 2022-04-03 10:48:37.223 [rank:5] [train], epoch: 29/50, iter: 800/834, loss: 0.30228, lr: 0.532547, top1: 0.64573, throughput: 310.70 | 2022-04-03 10:48:37.234 [rank:4] [train], epoch: 29/50, iter: 800/834, loss: 0.30079, lr: 0.532547, top1: 0.64875, throughput: 310.83 | 2022-04-03 10:48:37.248 [rank:2] [train], epoch: 29/50, iter: 800/834, loss: 0.30095, lr: 0.532547, top1: 0.65068, throughput: 310.63 | 2022-04-03 10:48:37.249 [rank:6] [train], epoch: 29/50, iter: 800/834, loss: 0.30546, lr: 0.532547, top1: 0.63484, throughput: 310.98 | 2022-04-03 10:48:37.254 [rank:0] [train], epoch: 29/50, iter: 800/834, loss: 0.30297, lr: 0.532547, top1: 0.64427, throughput: 310.82 | 2022-04-03 10:48:37.257 [rank:3] [train], epoch: 29/50, iter: 800/834, loss: 0.30333, lr: 0.532547, top1: 0.64193, throughput: 310.62 | 2022-04-03 10:48:37.263 [rank:7] [train], epoch: 29/50, iter: 800/834, loss: 0.30596, lr: 0.532547, top1: 0.63745, throughput: 310.50 | 2022-04-03 10:48:37.290 [rank:2] [train], epoch: 29/50, iter: 834/834, loss: 0.30432, lr: 0.530675, top1: 0.64415, throughput: 312.48 | 2022-04-03 10:48:58.140 [rank:3] [train], epoch: 29/50, iter: 834/834, loss: 0.30654, lr: 0.530675, top1: 0.63097, throughput: 312.64 | 2022-04-03 10:48:58.143 [rank:4] [train], epoch: 29/50, iter: 834/834, loss: 0.30217, lr: 0.530675, top1: 0.64859, throughput: 312.37 | 2022-04-03 10:48:58.146 [rank:0] [train], epoch: 29/50, iter: 834/834, loss: 0.30429, lr: 0.530675, top1: 0.64369, throughput: 312.49 | 2022-04-03 10:48:58.148 [rank:6] [train], epoch: 29/50, iter: 834/834, loss: 0.30753, lr: 0.530675, top1: 0.63312, throughput: 312.38 | 2022-04-03 10:48:58.152 [rank:7] [train], epoch: 29/50, iter: 834/834, loss: 0.30759, lr: 0.530675, top1: 0.62868, throughput: 312.83 | 2022-04-03 10:48:58.158 [rank:5] [train], epoch: 29/50, iter: 834/834, loss: 0.30416, lr: 0.530675, top1: 0.63771, throughput: 311.49 | 2022-04-03 10:48:58.192 [rank:1] [train], epoch: 29/50, iter: 834/834, loss: 0.29982, lr: 0.530675, top1: 0.65257, throughput: 311.24 | 2022-04-03 10:48:58.198 [rank:0] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64112, throughput: 479.36 | 2022-04-03 10:49:11.186 [rank:2] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.63632, throughput: 478.97 | 2022-04-03 10:49:11.189 [rank:1] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.63584, throughput: 481.07 | 2022-04-03 10:49:11.190 [rank:3] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64480, throughput: 478.72 | 2022-04-03 10:49:11.199 [rank:5] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.63408, throughput: 480.22 | 2022-04-03 10:49:11.207 [rank:7] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64800, throughput: 478.86 | 2022-04-03 10:49:11.209 [rank:6] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64560, throughput: 477.69 | 2022-04-03 10:49:11.235 [rank:4] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.63648, throughput: 477.38 | 2022-04-03 10:49:11.238 [rank:5] [train], epoch: 30/50, iter: 100/834, loss: 0.29841, lr: 0.525179, top1: 0.64823, throughput: 312.97 | 2022-04-03 10:50:12.554 [rank:6] [train], epoch: 30/50, iter: 100/834, loss: 0.29806, lr: 0.525179, top1: 0.65776, throughput: 312.97 | 2022-04-03 10:50:12.583 [rank:2] [train], epoch: 30/50, iter: 100/834, loss: 0.29697, lr: 0.525179, top1: 0.65333, throughput: 312.62 | 2022-04-03 10:50:12.605 [rank:1] [train], epoch: 30/50, iter: 100/834, loss: 0.29334, lr: 0.525179, top1: 0.66453, throughput: 312.55 | 2022-04-03 10:50:12.620 [rank:4] [train], epoch: 30/50, iter: 100/834, loss: 0.29942, lr: 0.525179, top1: 0.65208, throughput: 312.65 | 2022-04-03 10:50:12.650 [rank:3] [train], epoch: 30/50, iter: 100/834, loss: 0.29886, lr: 0.525179, top1: 0.65073, throughput: 312.44 | 2022-04-03 10:50:12.651 [rank:0] [train], epoch: 30/50, iter: 100/834, loss: 0.29739, lr: 0.525179, top1: 0.65604, throughput: 312.36 | 2022-04-03 10:50:12.653 [rank:7] [train], epoch: 30/50, iter: 100/834, loss: 0.29634, lr: 0.525179, top1: 0.65630, throughput: 312.85 | 2022-04-03 10:50:12.581 [rank:1] [train], epoch: 30/50, iter: 200/834, loss: 0.29900, lr: 0.519697, top1: 0.65495, throughput: 313.63 | 2022-04-03 10:51:13.839 [rank:2] [train], epoch: 30/50, iter: 200/834, loss: 0.29837, lr: 0.519697, top1: 0.65411, throughput: 313.37 | 2022-04-03 10:51:13.875 [rank:7] [train], epoch: 30/50, iter: 200/834, loss: 0.29938, lr: 0.519697, top1: 0.64984, throughput: 313.24 | 2022-04-03 10:51:13.877 [rank:3] [train], epoch: 30/50, iter: 200/834, loss: 0.29672, lr: 0.519697, top1: 0.65552, throughput: 313.57 | 2022-04-03 10:51:13.881 [rank:0] [train], epoch: 30/50, iter: 200/834, loss: 0.29697, lr: 0.519697, top1: 0.65786, throughput: 313.57 | 2022-04-03 10:51:13.882 [rank:5] [train], epoch: 30/50, iter: 200/834, loss: 0.29779, lr: 0.519697, top1: 0.65292, throughput: 312.99 | 2022-04-03 10:51:13.897 [rank:6] [train], epoch: 30/50, iter: 200/834, loss: 0.29787, lr: 0.519697, top1: 0.65328, throughput: 313.13 | 2022-04-03 10:51:13.899 [rank:4] [train], epoch: 30/50, iter: 200/834, loss: 0.29753, lr: 0.519697, top1: 0.65260, throughput: 313.44 | 2022-04-03 10:51:13.905 [rank:6] [train], epoch: 30/50, iter: 300/834, loss: 0.29996, lr: 0.514229, top1: 0.64807, throughput: 313.19 | 2022-04-03 10:52:15.205 [rank:5] [train], epoch: 30/50, iter: 300/834, loss: 0.29773, lr: 0.514229, top1: 0.65734, throughput: 313.07 | 2022-04-03 10:52:15.226 [rank:0] [train], epoch: 30/50, iter: 300/834, loss: 0.29747, lr: 0.514229, top1: 0.65281, throughput: 312.91 | 2022-04-03 10:52:15.243 [rank:1] [train], epoch: 30/50, iter: 300/834, loss: 0.29996, lr: 0.514229, top1: 0.65068, throughput: 312.62 | 2022-04-03 10:52:15.255 [rank:2] [train], epoch: 30/50, iter: 300/834, loss: 0.30011, lr: 0.514229, top1: 0.64812, throughput: 312.74 | 2022-04-03 10:52:15.267 [rank:7] [train], epoch: 30/50, iter: 300/834, loss: 0.29904, lr: 0.514229, top1: 0.65016, throughput: 312.71 | 2022-04-03 10:52:15.275 [rank:4] [train], epoch: 30/50, iter: 300/834, loss: 0.30066, lr: 0.514229, top1: 0.64734, throughput: 312.82 | 2022-04-03 10:52:15.282 [rank:3] [train], epoch: 30/50, iter: 300/834, loss: 0.29844, lr: 0.514229, top1: 0.65516, throughput: 312.65 | 2022-04-03 10:52:15.292 [rank:3] [train], epoch: 30/50, iter: 400/834, loss: 0.29791, lr: 0.508775, top1: 0.65328, throughput: 312.53 | 2022-04-03 10:53:16.727 [rank:7] [train], epoch: 30/50, iter: 400/834, loss: 0.29945, lr: 0.508775, top1: 0.65036, throughput: 312.28 | 2022-04-03 10:53:16.758 [rank:6] [train], epoch: 30/50, iter: 400/834, loss: 0.29754, lr: 0.508775, top1: 0.65531, throughput: 311.89 | 2022-04-03 10:53:16.765 [rank:5] [train], epoch: 30/50, iter: 400/834, loss: 0.29892, lr: 0.508775, top1: 0.64964, throughput: 311.99 | 2022-04-03 10:53:16.766 [rank:4] [train], epoch: 30/50, iter: 400/834, loss: 0.29975, lr: 0.508775, top1: 0.64792, throughput: 312.18 | 2022-04-03 10:53:16.786 [rank:2] [train], epoch: 30/50, iter: 400/834, loss: 0.30144, lr: 0.508775, top1: 0.64542, throughput: 311.95 | 2022-04-03 10:53:16.816 [rank:1] [train], epoch: 30/50, iter: 400/834, loss: 0.30318, lr: 0.508775, top1: 0.64495, throughput: 311.80 | 2022-04-03 10:53:16.833 [rank:0] [train], epoch: 30/50, iter: 400/834, loss: 0.29801, lr: 0.508775, top1: 0.65469, throughput: 312.13 | 2022-04-03 10:53:16.755 [rank:5] [train], epoch: 30/50, iter: 500/834, loss: 0.30007, lr: 0.503336, top1: 0.64740, throughput: 311.72 | 2022-04-03 10:54:18.358 [rank:7] [train], epoch: 30/50, iter: 500/834, loss: 0.29834, lr: 0.503336, top1: 0.65245, throughput: 311.68 | 2022-04-03 10:54:18.359 [rank:6] [train], epoch: 30/50, iter: 500/834, loss: 0.29931, lr: 0.503336, top1: 0.65599, throughput: 311.72 | 2022-04-03 10:54:18.359 [rank:4] [train], epoch: 30/50, iter: 500/834, loss: 0.29751, lr: 0.503336, top1: 0.65078, throughput: 311.76 | 2022-04-03 10:54:18.372 [rank:2] [train], epoch: 30/50, iter: 500/834, loss: 0.30271, lr: 0.503336, top1: 0.64224, throughput: 311.74 | 2022-04-03 10:54:18.406 [rank:1] [train], epoch: 30/50, iter: 500/834, loss: 0.30110, lr: 0.503336, top1: 0.64620, throughput: 311.81 | 2022-04-03 10:54:18.409 [rank:0] [train], epoch: 30/50, iter: 500/834, loss: 0.30131, lr: 0.503336, top1: 0.64865, throughput: 311.36 | 2022-04-03 10:54:18.419 [rank:3] [train], epoch: 30/50, iter: 500/834, loss: 0.29916, lr: 0.503336, top1: 0.65401, throughput: 311.22 | 2022-04-03 10:54:18.420 [rank:2] [train], epoch: 30/50, iter: 600/834, loss: 0.30004, lr: 0.497912, top1: 0.65005, throughput: 312.03 | 2022-04-03 10:55:19.939 [rank:1] [train], epoch: 30/50, iter: 600/834, loss: 0.29761, lr: 0.497912, top1: 0.65510, throughput: 312.00 | 2022-04-03 10:55:19.948 [rank:0] [train], epoch: 30/50, iter: 600/834, loss: 0.29864, lr: 0.497912, top1: 0.64906, throughput: 311.91 | 2022-04-03 10:55:19.976 [rank:5] [train], epoch: 30/50, iter: 600/834, loss: 0.30059, lr: 0.497912, top1: 0.65073, throughput: 311.56 | 2022-04-03 10:55:19.983 [rank:4] [train], epoch: 30/50, iter: 600/834, loss: 0.30177, lr: 0.497912, top1: 0.64724, throughput: 311.62 | 2022-04-03 10:55:19.984 [rank:3] [train], epoch: 30/50, iter: 600/834, loss: 0.30071, lr: 0.497912, top1: 0.64891, throughput: 311.83 | 2022-04-03 10:55:19.991 [rank:6] [train], epoch: 30/50, iter: 600/834, loss: 0.29923, lr: 0.497912, top1: 0.65266, throughput: 311.35 | 2022-04-03 10:55:20.026 [rank:7] [train], epoch: 30/50, iter: 600/834, loss: 0.29572, lr: 0.497912, top1: 0.65667, throughput: 311.35 | 2022-04-03 10:55:20.027 [rank:6] [train], epoch: 30/50, iter: 700/834, loss: 0.30080, lr: 0.492503, top1: 0.65089, throughput: 313.70 | 2022-04-03 10:56:21.232 [rank:1] [train], epoch: 30/50, iter: 700/834, loss: 0.29734, lr: 0.492503, top1: 0.65729, throughput: 313.29 | 2022-04-03 10:56:21.233 [rank:4] [train], epoch: 30/50, iter: 700/834, loss: 0.29867, lr: 0.492503, top1: 0.65292, throughput: 313.37 | 2022-04-03 10:56:21.254 [rank:5] [train], epoch: 30/50, iter: 700/834, loss: 0.30051, lr: 0.492503, top1: 0.65130, throughput: 313.34 | 2022-04-03 10:56:21.259 [rank:2] [train], epoch: 30/50, iter: 700/834, loss: 0.30060, lr: 0.492503, top1: 0.64198, throughput: 313.11 | 2022-04-03 10:56:21.259 [rank:3] [train], epoch: 30/50, iter: 700/834, loss: 0.29698, lr: 0.492503, top1: 0.65620, throughput: 313.31 | 2022-04-03 10:56:21.271 [rank:7] [train], epoch: 30/50, iter: 700/834, loss: 0.29814, lr: 0.492503, top1: 0.65146, throughput: 313.47 | 2022-04-03 10:56:21.277 [rank:0] [train], epoch: 30/50, iter: 700/834, loss: 0.30045, lr: 0.492503, top1: 0.65130, throughput: 313.11 | 2022-04-03 10:56:21.296 [rank:6] [train], epoch: 30/50, iter: 800/834, loss: 0.30032, lr: 0.487110, top1: 0.65016, throughput: 312.76 | 2022-04-03 10:57:22.622 [rank:7] [train], epoch: 30/50, iter: 800/834, loss: 0.30044, lr: 0.487110, top1: 0.65000, throughput: 312.80 | 2022-04-03 10:57:22.657 [rank:4] [train], epoch: 30/50, iter: 800/834, loss: 0.29954, lr: 0.487110, top1: 0.65156, throughput: 312.68 | 2022-04-03 10:57:22.659 [rank:0] [train], epoch: 30/50, iter: 800/834, loss: 0.29839, lr: 0.487110, top1: 0.64932, throughput: 312.89 | 2022-04-03 10:57:22.660 [rank:5] [train], epoch: 30/50, iter: 800/834, loss: 0.29825, lr: 0.487110, top1: 0.65234, throughput: 312.68 | 2022-04-03 10:57:22.664 [rank:3] [train], epoch: 30/50, iter: 800/834, loss: 0.29842, lr: 0.487110, top1: 0.65083, throughput: 312.73 | 2022-04-03 10:57:22.666 [rank:2] [train], epoch: 30/50, iter: 800/834, loss: 0.29953, lr: 0.487110, top1: 0.64703, throughput: 312.63 | 2022-04-03 10:57:22.673 [rank:1] [train], epoch: 30/50, iter: 800/834, loss: 0.30051, lr: 0.487110, top1: 0.65089, throughput: 312.37 | 2022-04-03 10:57:22.699 [rank:2] [train], epoch: 30/50, iter: 834/834, loss: 0.29925, lr: 0.485280, top1: 0.65579, throughput: 312.05 | 2022-04-03 10:57:43.593 [rank:6] [train], epoch: 30/50, iter: 834/834, loss: 0.30324, lr: 0.485280, top1: 0.64338, throughput: 311.11 | 2022-04-03 10:57:43.604 [rank:0] [train], epoch: 30/50, iter: 834/834, loss: 0.29872, lr: 0.485280, top1: 0.65594, throughput: 311.56 | 2022-04-03 10:57:43.613 [rank:4] [train], epoch: 30/50, iter: 834/834, loss: 0.30086, lr: 0.485280, top1: 0.64537, throughput: 311.46 | 2022-04-03 10:57:43.619 [rank:1] [train], epoch: 30/50, iter: 834/834, loss: 0.29995, lr: 0.485280, top1: 0.64568, throughput: 311.92 | 2022-04-03 10:57:43.628 [rank:5] [train], epoch: 30/50, iter: 834/834, loss: 0.29681, lr: 0.485280, top1: 0.65809, throughput: 311.18 | 2022-04-03 10:57:43.643 [rank:3] [train], epoch: 30/50, iter: 834/834, loss: 0.29819, lr: 0.485280, top1: 0.64737, throughput: 311.11 | 2022-04-03 10:57:43.649 [rank:7] [train], epoch: 30/50, iter: 834/834, loss: 0.30167, lr: 0.485280, top1: 0.64798, throughput: 310.80 | 2022-04-03 10:57:43.661 [rank:0] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.65328, throughput: 485.30 | 2022-04-03 10:57:56.491 [rank:2] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.64432, throughput: 484.37 | 2022-04-03 10:57:56.496 [rank:1] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.64960, throughput: 485.65 | 2022-04-03 10:57:56.497 [rank:3] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.64368, throughput: 486.09 | 2022-04-03 10:57:56.507 [rank:4] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.64400, throughput: 484.90 | 2022-04-03 10:57:56.508 [rank:5] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.64368, throughput: 485.64 | 2022-04-03 10:57:56.512 [rank:7] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.65152, throughput: 485.62 | 2022-04-03 10:57:56.532 [rank:6] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.65376, throughput: 482.85 | 2022-04-03 10:57:56.548 [rank:6] [train], epoch: 31/50, iter: 100/834, loss: 0.29422, lr: 0.479909, top1: 0.66031, throughput: 313.36 | 2022-04-03 10:58:57.820 [rank:7] [train], epoch: 31/50, iter: 100/834, loss: 0.29230, lr: 0.479909, top1: 0.66703, throughput: 313.27 | 2022-04-03 10:58:57.821 [rank:5] [train], epoch: 31/50, iter: 100/834, loss: 0.28850, lr: 0.479909, top1: 0.67255, throughput: 313.11 | 2022-04-03 10:58:57.832 [rank:2] [train], epoch: 31/50, iter: 100/834, loss: 0.29356, lr: 0.479909, top1: 0.66099, throughput: 313.02 | 2022-04-03 10:58:57.835 [rank:1] [train], epoch: 31/50, iter: 100/834, loss: 0.29088, lr: 0.479909, top1: 0.67047, throughput: 312.96 | 2022-04-03 10:58:57.846 [rank:4] [train], epoch: 31/50, iter: 100/834, loss: 0.29335, lr: 0.479909, top1: 0.66531, throughput: 313.01 | 2022-04-03 10:58:57.849 [rank:0] [train], epoch: 31/50, iter: 100/834, loss: 0.29340, lr: 0.479909, top1: 0.66349, throughput: 312.88 | 2022-04-03 10:58:57.856 [rank:3] [train], epoch: 31/50, iter: 100/834, loss: 0.29127, lr: 0.479909, top1: 0.66464, throughput: 312.95 | 2022-04-03 10:58:57.859 [rank:5] [train], epoch: 31/50, iter: 200/834, loss: 0.29522, lr: 0.474554, top1: 0.65562, throughput: 313.16 | 2022-04-03 10:59:59.142 [rank:1] [train], epoch: 31/50, iter: 200/834, loss: 0.29363, lr: 0.474554, top1: 0.66255, throughput: 313.16 | 2022-04-03 10:59:59.158 [rank:7] [train], epoch: 31/50, iter: 200/834, loss: 0.29656, lr: 0.474554, top1: 0.65531, throughput: 313.01 | 2022-04-03 10:59:59.161 [rank:6] [train], epoch: 31/50, iter: 200/834, loss: 0.29669, lr: 0.474554, top1: 0.65370, throughput: 312.93 | 2022-04-03 10:59:59.176 [rank:2] [train], epoch: 31/50, iter: 200/834, loss: 0.29061, lr: 0.474554, top1: 0.67031, throughput: 312.98 | 2022-04-03 10:59:59.180 [rank:3] [train], epoch: 31/50, iter: 200/834, loss: 0.29365, lr: 0.474554, top1: 0.66344, throughput: 313.07 | 2022-04-03 10:59:59.188 [rank:0] [train], epoch: 31/50, iter: 200/834, loss: 0.29737, lr: 0.474554, top1: 0.65786, throughput: 312.89 | 2022-04-03 10:59:59.219 [rank:4] [train], epoch: 31/50, iter: 200/834, loss: 0.29164, lr: 0.474554, top1: 0.66536, throughput: 313.19 | 2022-04-03 10:59:59.154 [rank:6] [train], epoch: 31/50, iter: 300/834, loss: 0.29856, lr: 0.469215, top1: 0.65250, throughput: 312.33 | 2022-04-03 11:01:00.649 [rank:0] [train], epoch: 31/50, iter: 300/834, loss: 0.29516, lr: 0.469215, top1: 0.65969, throughput: 312.52 | 2022-04-03 11:01:00.656 [rank:5] [train], epoch: 31/50, iter: 300/834, loss: 0.29639, lr: 0.469215, top1: 0.65391, throughput: 312.10 | 2022-04-03 11:01:00.661 [rank:2] [train], epoch: 31/50, iter: 300/834, loss: 0.29481, lr: 0.469215, top1: 0.65906, throughput: 312.27 | 2022-04-03 11:01:00.666 [rank:7] [train], epoch: 31/50, iter: 300/834, loss: 0.29517, lr: 0.469215, top1: 0.65807, throughput: 312.04 | 2022-04-03 11:01:00.692 [rank:3] [train], epoch: 31/50, iter: 300/834, loss: 0.29484, lr: 0.469215, top1: 0.66318, throughput: 312.15 | 2022-04-03 11:01:00.696 [rank:4] [train], epoch: 31/50, iter: 300/834, loss: 0.29637, lr: 0.469215, top1: 0.65583, throughput: 311.99 | 2022-04-03 11:01:00.696 [rank:1] [train], epoch: 31/50, iter: 300/834, loss: 0.29451, lr: 0.469215, top1: 0.66557, throughput: 312.00 | 2022-04-03 11:01:00.695 [rank:6] [train], epoch: 31/50, iter: 400/834, loss: 0.29602, lr: 0.463893, top1: 0.65130, throughput: 312.78 | 2022-04-03 11:02:02.034 [rank:1] [train], epoch: 31/50, iter: 400/834, loss: 0.29887, lr: 0.463893, top1: 0.65271, throughput: 312.98 | 2022-04-03 11:02:02.041 [rank:3] [train], epoch: 31/50, iter: 400/834, loss: 0.29428, lr: 0.463893, top1: 0.66005, throughput: 312.96 | 2022-04-03 11:02:02.045 [rank:4] [train], epoch: 31/50, iter: 400/834, loss: 0.29405, lr: 0.463893, top1: 0.66411, throughput: 312.95 | 2022-04-03 11:02:02.047 [rank:0] [train], epoch: 31/50, iter: 400/834, loss: 0.29923, lr: 0.463893, top1: 0.65167, throughput: 312.75 | 2022-04-03 11:02:02.047 [rank:2] [train], epoch: 31/50, iter: 400/834, loss: 0.29686, lr: 0.463893, top1: 0.65604, throughput: 312.73 | 2022-04-03 11:02:02.061 [rank:5] [train], epoch: 31/50, iter: 400/834, loss: 0.29396, lr: 0.463893, top1: 0.66057, throughput: 312.70 | 2022-04-03 11:02:02.061 [rank:7] [train], epoch: 31/50, iter: 400/834, loss: 0.29518, lr: 0.463893, top1: 0.65766, throughput: 312.76 | 2022-04-03 11:02:02.082 [rank:6] [train], epoch: 31/50, iter: 500/834, loss: 0.29540, lr: 0.458589, top1: 0.65745, throughput: 313.74 | 2022-04-03 11:03:03.232 [rank:2] [train], epoch: 31/50, iter: 500/834, loss: 0.29502, lr: 0.458589, top1: 0.65979, throughput: 313.72 | 2022-04-03 11:03:03.262 [rank:5] [train], epoch: 31/50, iter: 500/834, loss: 0.29654, lr: 0.458589, top1: 0.65745, throughput: 313.65 | 2022-04-03 11:03:03.277 [rank:7] [train], epoch: 31/50, iter: 500/834, loss: 0.29581, lr: 0.458589, top1: 0.65984, throughput: 313.67 | 2022-04-03 11:03:03.293 [rank:4] [train], epoch: 31/50, iter: 500/834, loss: 0.29627, lr: 0.458589, top1: 0.65839, throughput: 313.36 | 2022-04-03 11:03:03.319 [rank:1] [train], epoch: 31/50, iter: 500/834, loss: 0.29522, lr: 0.458589, top1: 0.65687, throughput: 313.30 | 2022-04-03 11:03:03.325 [rank:3] [train], epoch: 31/50, iter: 500/834, loss: 0.29727, lr: 0.458589, top1: 0.65578, throughput: 313.28 | 2022-04-03 11:03:03.332 [rank:0] [train], epoch: 31/50, iter: 500/834, loss: 0.29600, lr: 0.458589, top1: 0.65349, throughput: 313.21 | 2022-04-03 11:03:03.347 [rank:5] [train], epoch: 31/50, iter: 600/834, loss: 0.29704, lr: 0.453302, top1: 0.65870, throughput: 313.50 | 2022-04-03 11:04:04.520 [rank:3] [train], epoch: 31/50, iter: 600/834, loss: 0.30056, lr: 0.453302, top1: 0.64719, throughput: 313.72 | 2022-04-03 11:04:04.533 [rank:1] [train], epoch: 31/50, iter: 600/834, loss: 0.29700, lr: 0.453302, top1: 0.65047, throughput: 313.63 | 2022-04-03 11:04:04.544 [rank:4] [train], epoch: 31/50, iter: 600/834, loss: 0.29709, lr: 0.453302, top1: 0.65448, throughput: 313.43 | 2022-04-03 11:04:04.577 [rank:2] [train], epoch: 31/50, iter: 600/834, loss: 0.29551, lr: 0.453302, top1: 0.65766, throughput: 313.12 | 2022-04-03 11:04:04.580 [rank:6] [train], epoch: 31/50, iter: 600/834, loss: 0.29779, lr: 0.453302, top1: 0.65245, throughput: 313.34 | 2022-04-03 11:04:04.508 [rank:0] [train], epoch: 31/50, iter: 600/834, loss: 0.29567, lr: 0.453302, top1: 0.65750, throughput: 313.43 | 2022-04-03 11:04:04.605 [rank:7] [train], epoch: 31/50, iter: 600/834, loss: 0.29828, lr: 0.453302, top1: 0.65630, throughput: 312.98 | 2022-04-03 11:04:04.639 [rank:0] [train], epoch: 31/50, iter: 700/834, loss: 0.29413, lr: 0.448033, top1: 0.66193, throughput: 313.37 | 2022-04-03 11:05:05.876 [rank:6] [train], epoch: 31/50, iter: 700/834, loss: 0.29418, lr: 0.448033, top1: 0.66062, throughput: 312.83 | 2022-04-03 11:05:05.883 [rank:7] [train], epoch: 31/50, iter: 700/834, loss: 0.29677, lr: 0.448033, top1: 0.65740, throughput: 313.44 | 2022-04-03 11:05:05.893 [rank:1] [train], epoch: 31/50, iter: 700/834, loss: 0.29770, lr: 0.448033, top1: 0.65344, throughput: 312.94 | 2022-04-03 11:05:05.897 [rank:5] [train], epoch: 31/50, iter: 700/834, loss: 0.29534, lr: 0.448033, top1: 0.65885, throughput: 312.79 | 2022-04-03 11:05:05.902 [rank:3] [train], epoch: 31/50, iter: 700/834, loss: 0.29602, lr: 0.448033, top1: 0.65630, throughput: 312.79 | 2022-04-03 11:05:05.916 [rank:2] [train], epoch: 31/50, iter: 700/834, loss: 0.29577, lr: 0.448033, top1: 0.65755, throughput: 313.03 | 2022-04-03 11:05:05.916 [rank:4] [train], epoch: 31/50, iter: 700/834, loss: 0.29568, lr: 0.448033, top1: 0.65911, throughput: 312.97 | 2022-04-03 11:05:05.924 [rank:5] [train], epoch: 31/50, iter: 800/834, loss: 0.29537, lr: 0.442783, top1: 0.66120, throughput: 313.56 | 2022-04-03 11:06:07.135 [rank:2] [train], epoch: 31/50, iter: 800/834, loss: 0.29614, lr: 0.442783, top1: 0.65464, throughput: 313.61 | 2022-04-03 11:06:07.138 [rank:1] [train], epoch: 31/50, iter: 800/834, loss: 0.29600, lr: 0.442783, top1: 0.65896, throughput: 313.40 | 2022-04-03 11:06:07.160 [rank:6] [train], epoch: 31/50, iter: 800/834, loss: 0.29510, lr: 0.442783, top1: 0.66031, throughput: 313.18 | 2022-04-03 11:06:07.191 [rank:7] [train], epoch: 31/50, iter: 800/834, loss: 0.29620, lr: 0.442783, top1: 0.65474, throughput: 313.22 | 2022-04-03 11:06:07.192 [rank:3] [train], epoch: 31/50, iter: 800/834, loss: 0.29778, lr: 0.442783, top1: 0.65010, throughput: 313.24 | 2022-04-03 11:06:07.211 [rank:0] [train], epoch: 31/50, iter: 800/834, loss: 0.29469, lr: 0.442783, top1: 0.66078, throughput: 313.02 | 2022-04-03 11:06:07.214 [rank:4] [train], epoch: 31/50, iter: 800/834, loss: 0.29547, lr: 0.442783, top1: 0.65807, throughput: 313.62 | 2022-04-03 11:06:07.144 [rank:5] [train], epoch: 31/50, iter: 834/834, loss: 0.29867, lr: 0.441002, top1: 0.65594, throughput: 308.40 | 2022-04-03 11:06:28.302 [rank:3] [train], epoch: 31/50, iter: 834/834, loss: 0.29404, lr: 0.441002, top1: 0.66452, throughput: 309.50 | 2022-04-03 11:06:28.303 [rank:4] [train], epoch: 31/50, iter: 834/834, loss: 0.29782, lr: 0.441002, top1: 0.65028, throughput: 308.50 | 2022-04-03 11:06:28.305 [rank:1] [train], epoch: 31/50, iter: 834/834, loss: 0.29440, lr: 0.441002, top1: 0.65977, throughput: 308.71 | 2022-04-03 11:06:28.306 [rank:2] [train], epoch: 31/50, iter: 834/834, loss: 0.29940, lr: 0.441002, top1: 0.65257, throughput: 308.30 | 2022-04-03 11:06:28.312 [rank:0] [train], epoch: 31/50, iter: 834/834, loss: 0.29902, lr: 0.441002, top1: 0.65885, throughput: 309.38 | 2022-04-03 11:06:28.314 [rank:6] [train], epoch: 31/50, iter: 834/834, loss: 0.29519, lr: 0.441002, top1: 0.65993, throughput: 309.03 | 2022-04-03 11:06:28.315 [rank:7] [train], epoch: 31/50, iter: 834/834, loss: 0.29283, lr: 0.441002, top1: 0.66360, throughput: 308.91 | 2022-04-03 11:06:28.324 [rank:0] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.68400, throughput: 488.45 | 2022-04-03 11:06:41.109 [rank:1] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.68016, throughput: 488.05 | 2022-04-03 11:06:41.112 [rank:2] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.66928, throughput: 487.68 | 2022-04-03 11:06:41.128 [rank:5] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.66624, throughput: 487.29 | 2022-04-03 11:06:41.128 [rank:7] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.67360, throughput: 487.82 | 2022-04-03 11:06:41.137 [rank:6] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.67616, throughput: 487.37 | 2022-04-03 11:06:41.139 [rank:3] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.66768, throughput: 486.28 | 2022-04-03 11:06:41.156 [rank:4] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.67184, throughput: 486.32 | 2022-04-03 11:06:41.157 [rank:1] [train], epoch: 32/50, iter: 100/834, loss: 0.29203, lr: 0.435776, top1: 0.66359, throughput: 311.99 | 2022-04-03 11:07:42.653 [rank:3] [train], epoch: 32/50, iter: 100/834, loss: 0.28701, lr: 0.435776, top1: 0.67630, throughput: 312.17 | 2022-04-03 11:07:42.660 [rank:0] [train], epoch: 32/50, iter: 100/834, loss: 0.29085, lr: 0.435776, top1: 0.66609, throughput: 311.79 | 2022-04-03 11:07:42.689 [rank:5] [train], epoch: 32/50, iter: 100/834, loss: 0.29145, lr: 0.435776, top1: 0.66583, throughput: 311.81 | 2022-04-03 11:07:42.705 [rank:7] [train], epoch: 32/50, iter: 100/834, loss: 0.29396, lr: 0.435776, top1: 0.66245, throughput: 311.83 | 2022-04-03 11:07:42.708 [rank:4] [train], epoch: 32/50, iter: 100/834, loss: 0.29257, lr: 0.435776, top1: 0.66505, throughput: 311.89 | 2022-04-03 11:07:42.718 [rank:6] [train], epoch: 32/50, iter: 100/834, loss: 0.28916, lr: 0.435776, top1: 0.67068, throughput: 312.14 | 2022-04-03 11:07:42.651 [rank:2] [train], epoch: 32/50, iter: 100/834, loss: 0.29210, lr: 0.435776, top1: 0.66396, throughput: 311.63 | 2022-04-03 11:07:42.739 [rank:3] [train], epoch: 32/50, iter: 200/834, loss: 0.29003, lr: 0.430568, top1: 0.66964, throughput: 309.45 | 2022-04-03 11:08:44.707 [rank:5] [train], epoch: 32/50, iter: 200/834, loss: 0.29105, lr: 0.430568, top1: 0.66453, throughput: 309.64 | 2022-04-03 11:08:44.713 [rank:7] [train], epoch: 32/50, iter: 200/834, loss: 0.29274, lr: 0.430568, top1: 0.66490, throughput: 309.63 | 2022-04-03 11:08:44.718 [rank:2] [train], epoch: 32/50, iter: 200/834, loss: 0.29304, lr: 0.430568, top1: 0.66411, throughput: 309.64 | 2022-04-03 11:08:44.747 [rank:6] [train], epoch: 32/50, iter: 200/834, loss: 0.29189, lr: 0.430568, top1: 0.66411, throughput: 309.10 | 2022-04-03 11:08:44.766 [rank:4] [train], epoch: 32/50, iter: 200/834, loss: 0.29088, lr: 0.430568, top1: 0.66385, throughput: 309.42 | 2022-04-03 11:08:44.769 [rank:1] [train], epoch: 32/50, iter: 200/834, loss: 0.29114, lr: 0.430568, top1: 0.66526, throughput: 309.04 | 2022-04-03 11:08:44.780 [rank:0] [train], epoch: 32/50, iter: 200/834, loss: 0.28718, lr: 0.430568, top1: 0.67568, throughput: 309.63 | 2022-04-03 11:08:44.698 [rank:1] [train], epoch: 32/50, iter: 300/834, loss: 0.29212, lr: 0.425380, top1: 0.66615, throughput: 313.12 | 2022-04-03 11:09:46.099 [rank:6] [train], epoch: 32/50, iter: 300/834, loss: 0.29379, lr: 0.425380, top1: 0.66052, throughput: 312.95 | 2022-04-03 11:09:46.118 [rank:3] [train], epoch: 32/50, iter: 300/834, loss: 0.28947, lr: 0.425380, top1: 0.66734, throughput: 312.57 | 2022-04-03 11:09:46.132 [rank:4] [train], epoch: 32/50, iter: 300/834, loss: 0.29194, lr: 0.425380, top1: 0.66635, throughput: 312.86 | 2022-04-03 11:09:46.138 [rank:7] [train], epoch: 32/50, iter: 300/834, loss: 0.29226, lr: 0.425380, top1: 0.66729, throughput: 312.60 | 2022-04-03 11:09:46.138 [rank:0] [train], epoch: 32/50, iter: 300/834, loss: 0.29288, lr: 0.425380, top1: 0.66208, throughput: 312.44 | 2022-04-03 11:09:46.151 [rank:5] [train], epoch: 32/50, iter: 300/834, loss: 0.29126, lr: 0.425380, top1: 0.66344, throughput: 312.50 | 2022-04-03 11:09:46.154 [rank:2] [train], epoch: 32/50, iter: 300/834, loss: 0.29007, lr: 0.425380, top1: 0.66729, throughput: 312.59 | 2022-04-03 11:09:46.170 [rank:6] [train], epoch: 32/50, iter: 400/834, loss: 0.29103, lr: 0.420212, top1: 0.66786, throughput: 315.23 | 2022-04-03 11:10:47.026 [rank:7] [train], epoch: 32/50, iter: 400/834, loss: 0.29222, lr: 0.420212, top1: 0.66583, throughput: 315.29 | 2022-04-03 11:10:47.034 [rank:5] [train], epoch: 32/50, iter: 400/834, loss: 0.29497, lr: 0.420212, top1: 0.65568, throughput: 315.25 | 2022-04-03 11:10:47.058 [rank:1] [train], epoch: 32/50, iter: 400/834, loss: 0.29265, lr: 0.420212, top1: 0.66521, throughput: 314.94 | 2022-04-03 11:10:47.064 [rank:4] [train], epoch: 32/50, iter: 400/834, loss: 0.29066, lr: 0.420212, top1: 0.66974, throughput: 315.05 | 2022-04-03 11:10:47.081 [rank:3] [train], epoch: 32/50, iter: 400/834, loss: 0.29113, lr: 0.420212, top1: 0.66594, throughput: 315.00 | 2022-04-03 11:10:47.084 [rank:2] [train], epoch: 32/50, iter: 400/834, loss: 0.29225, lr: 0.420212, top1: 0.66667, throughput: 315.04 | 2022-04-03 11:10:47.114 [rank:0] [train], epoch: 32/50, iter: 400/834, loss: 0.29176, lr: 0.420212, top1: 0.66307, throughput: 314.91 | 2022-04-03 11:10:47.120 [rank:4] [train], epoch: 32/50, iter: 500/834, loss: 0.29175, lr: 0.415063, top1: 0.66312, throughput: 312.58 | 2022-04-03 11:11:48.505 [rank:3] [train], epoch: 32/50, iter: 500/834, loss: 0.29114, lr: 0.415063, top1: 0.66573, throughput: 312.59 | 2022-04-03 11:11:48.506 [rank:5] [train], epoch: 32/50, iter: 500/834, loss: 0.29264, lr: 0.415063, top1: 0.66104, throughput: 312.36 | 2022-04-03 11:11:48.525 [rank:1] [train], epoch: 32/50, iter: 500/834, loss: 0.29024, lr: 0.415063, top1: 0.66859, throughput: 312.39 | 2022-04-03 11:11:48.525 [rank:6] [train], epoch: 32/50, iter: 500/834, loss: 0.29320, lr: 0.415063, top1: 0.65880, throughput: 312.19 | 2022-04-03 11:11:48.527 [rank:0] [train], epoch: 32/50, iter: 500/834, loss: 0.29691, lr: 0.415063, top1: 0.65729, throughput: 312.58 | 2022-04-03 11:11:48.544 [rank:7] [train], epoch: 32/50, iter: 500/834, loss: 0.29184, lr: 0.415063, top1: 0.66323, throughput: 312.14 | 2022-04-03 11:11:48.545 [rank:2] [train], epoch: 32/50, iter: 500/834, loss: 0.29198, lr: 0.415063, top1: 0.66609, throughput: 312.55 | 2022-04-03 11:11:48.545 [rank:1] [train], epoch: 32/50, iter: 600/834, loss: 0.29483, lr: 0.409934, top1: 0.65594, throughput: 313.74 | 2022-04-03 11:12:49.724 [rank:5] [train], epoch: 32/50, iter: 600/834, loss: 0.29257, lr: 0.409934, top1: 0.66516, throughput: 313.69 | 2022-04-03 11:12:49.732 [rank:4] [train], epoch: 32/50, iter: 600/834, loss: 0.29584, lr: 0.409934, top1: 0.65708, throughput: 313.38 | 2022-04-03 11:12:49.772 [rank:3] [train], epoch: 32/50, iter: 600/834, loss: 0.29177, lr: 0.409934, top1: 0.66630, throughput: 313.34 | 2022-04-03 11:12:49.780 [rank:2] [train], epoch: 32/50, iter: 600/834, loss: 0.29396, lr: 0.409934, top1: 0.66062, throughput: 313.53 | 2022-04-03 11:12:49.782 [rank:0] [train], epoch: 32/50, iter: 600/834, loss: 0.28999, lr: 0.409934, top1: 0.66823, throughput: 313.49 | 2022-04-03 11:12:49.790 [rank:7] [train], epoch: 32/50, iter: 600/834, loss: 0.29111, lr: 0.409934, top1: 0.66781, throughput: 313.47 | 2022-04-03 11:12:49.795 [rank:6] [train], epoch: 32/50, iter: 600/834, loss: 0.29094, lr: 0.409934, top1: 0.66698, throughput: 313.32 | 2022-04-03 11:12:49.805 [rank:6] [train], epoch: 32/50, iter: 700/834, loss: 0.29246, lr: 0.404826, top1: 0.66125, throughput: 313.46 | 2022-04-03 11:13:51.057 [rank:3] [train], epoch: 32/50, iter: 700/834, loss: 0.29344, lr: 0.404826, top1: 0.66250, throughput: 313.26 | 2022-04-03 11:13:51.072 [rank:7] [train], epoch: 32/50, iter: 700/834, loss: 0.29089, lr: 0.404826, top1: 0.66677, throughput: 313.33 | 2022-04-03 11:13:51.072 [rank:1] [train], epoch: 32/50, iter: 700/834, loss: 0.29229, lr: 0.404826, top1: 0.66432, throughput: 312.97 | 2022-04-03 11:13:51.072 [rank:5] [train], epoch: 32/50, iter: 700/834, loss: 0.29411, lr: 0.404826, top1: 0.66026, throughput: 312.98 | 2022-04-03 11:13:51.078 [rank:0] [train], epoch: 32/50, iter: 700/834, loss: 0.29433, lr: 0.404826, top1: 0.65818, throughput: 313.20 | 2022-04-03 11:13:51.092 [rank:2] [train], epoch: 32/50, iter: 700/834, loss: 0.29108, lr: 0.404826, top1: 0.66724, throughput: 313.16 | 2022-04-03 11:13:51.093 [rank:4] [train], epoch: 32/50, iter: 700/834, loss: 0.29160, lr: 0.404826, top1: 0.66234, throughput: 312.88 | 2022-04-03 11:13:51.138 [rank:5] [train], epoch: 32/50, iter: 800/834, loss: 0.29116, lr: 0.399738, top1: 0.66854, throughput: 314.36 | 2022-04-03 11:14:52.155 [rank:2] [train], epoch: 32/50, iter: 800/834, loss: 0.29331, lr: 0.399738, top1: 0.66104, throughput: 314.37 | 2022-04-03 11:14:52.167 [rank:6] [train], epoch: 32/50, iter: 800/834, loss: 0.29308, lr: 0.399738, top1: 0.66255, throughput: 314.08 | 2022-04-03 11:14:52.189 [rank:1] [train], epoch: 32/50, iter: 800/834, loss: 0.29237, lr: 0.399738, top1: 0.66406, throughput: 314.14 | 2022-04-03 11:14:52.191 [rank:0] [train], epoch: 32/50, iter: 800/834, loss: 0.29292, lr: 0.399738, top1: 0.66016, throughput: 314.25 | 2022-04-03 11:14:52.191 [rank:7] [train], epoch: 32/50, iter: 800/834, loss: 0.29038, lr: 0.399738, top1: 0.66562, throughput: 314.12 | 2022-04-03 11:14:52.196 [rank:3] [train], epoch: 32/50, iter: 800/834, loss: 0.29252, lr: 0.399738, top1: 0.66604, throughput: 314.11 | 2022-04-03 11:14:52.197 [rank:4] [train], epoch: 32/50, iter: 800/834, loss: 0.29041, lr: 0.399738, top1: 0.67115, throughput: 314.65 | 2022-04-03 11:14:52.159 [rank:1] [train], epoch: 32/50, iter: 834/834, loss: 0.28884, lr: 0.398013, top1: 0.67111, throughput: 312.66 | 2022-04-03 11:15:13.070 [rank:0] [train], epoch: 32/50, iter: 834/834, loss: 0.29222, lr: 0.398013, top1: 0.66988, throughput: 312.63 | 2022-04-03 11:15:13.072 [rank:6] [train], epoch: 32/50, iter: 834/834, loss: 0.29661, lr: 0.398013, top1: 0.65395, throughput: 312.55 | 2022-04-03 11:15:13.075 [rank:2] [train], epoch: 32/50, iter: 834/834, loss: 0.28754, lr: 0.398013, top1: 0.67800, throughput: 312.23 | 2022-04-03 11:15:13.075 [rank:3] [train], epoch: 32/50, iter: 834/834, loss: 0.29278, lr: 0.398013, top1: 0.66161, throughput: 312.66 | 2022-04-03 11:15:13.076 [rank:7] [train], epoch: 32/50, iter: 834/834, loss: 0.28878, lr: 0.398013, top1: 0.66697, throughput: 312.61 | 2022-04-03 11:15:13.078 [rank:5] [train], epoch: 32/50, iter: 834/834, loss: 0.29149, lr: 0.398013, top1: 0.66314, throughput: 311.93 | 2022-04-03 11:15:13.083 [rank:4] [train], epoch: 32/50, iter: 834/834, loss: 0.29667, lr: 0.398013, top1: 0.65334, throughput: 311.95 | 2022-04-03 11:15:13.085 [rank:0] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.68160, throughput: 481.58 | 2022-04-03 11:15:26.050 [rank:1] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67680, throughput: 481.26 | 2022-04-03 11:15:26.057 [rank:3] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67552, throughput: 481.33 | 2022-04-03 11:15:26.060 [rank:5] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67504, throughput: 481.32 | 2022-04-03 11:15:26.068 [rank:2] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67536, throughput: 480.94 | 2022-04-03 11:15:26.070 [rank:6] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.68288, throughput: 480.70 | 2022-04-03 11:15:26.077 [rank:7] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.68128, throughput: 480.71 | 2022-04-03 11:15:26.079 [rank:4] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.66848, throughput: 480.24 | 2022-04-03 11:15:26.099 [rank:2] [train], epoch: 33/50, iter: 100/834, loss: 0.28624, lr: 0.392953, top1: 0.67865, throughput: 314.95 | 2022-04-03 11:16:27.032 [rank:6] [train], epoch: 33/50, iter: 100/834, loss: 0.28377, lr: 0.392953, top1: 0.68375, throughput: 314.73 | 2022-04-03 11:16:27.081 [rank:1] [train], epoch: 33/50, iter: 100/834, loss: 0.28431, lr: 0.392953, top1: 0.68130, throughput: 314.60 | 2022-04-03 11:16:27.086 [rank:5] [train], epoch: 33/50, iter: 100/834, loss: 0.28652, lr: 0.392953, top1: 0.67943, throughput: 314.60 | 2022-04-03 11:16:27.098 [rank:3] [train], epoch: 33/50, iter: 100/834, loss: 0.28447, lr: 0.392953, top1: 0.68078, throughput: 314.55 | 2022-04-03 11:16:27.100 [rank:4] [train], epoch: 33/50, iter: 100/834, loss: 0.28545, lr: 0.392953, top1: 0.67922, throughput: 314.75 | 2022-04-03 11:16:27.101 [rank:7] [train], epoch: 33/50, iter: 100/834, loss: 0.28912, lr: 0.392953, top1: 0.67104, throughput: 314.59 | 2022-04-03 11:16:27.112 [rank:0] [train], epoch: 33/50, iter: 100/834, loss: 0.28820, lr: 0.392953, top1: 0.67344, throughput: 314.75 | 2022-04-03 11:16:27.051 [rank:6] [train], epoch: 33/50, iter: 200/834, loss: 0.28942, lr: 0.387915, top1: 0.67094, throughput: 313.04 | 2022-04-03 11:17:28.415 [rank:2] [train], epoch: 33/50, iter: 200/834, loss: 0.28995, lr: 0.387915, top1: 0.67125, throughput: 312.74 | 2022-04-03 11:17:28.425 [rank:1] [train], epoch: 33/50, iter: 200/834, loss: 0.28448, lr: 0.387915, top1: 0.68125, throughput: 312.99 | 2022-04-03 11:17:28.430 [rank:3] [train], epoch: 33/50, iter: 200/834, loss: 0.28813, lr: 0.387915, top1: 0.67167, throughput: 313.04 | 2022-04-03 11:17:28.434 [rank:5] [train], epoch: 33/50, iter: 200/834, loss: 0.28903, lr: 0.387915, top1: 0.67156, throughput: 312.88 | 2022-04-03 11:17:28.464 [rank:4] [train], epoch: 33/50, iter: 200/834, loss: 0.28775, lr: 0.387915, top1: 0.67339, throughput: 312.83 | 2022-04-03 11:17:28.476 [rank:7] [train], epoch: 33/50, iter: 200/834, loss: 0.28747, lr: 0.387915, top1: 0.67370, throughput: 312.85 | 2022-04-03 11:17:28.482 [rank:0] [train], epoch: 33/50, iter: 200/834, loss: 0.28468, lr: 0.387915, top1: 0.67875, throughput: 312.49 | 2022-04-03 11:17:28.493 [rank:7] [train], epoch: 33/50, iter: 300/834, loss: 0.28913, lr: 0.382898, top1: 0.66734, throughput: 312.95 | 2022-04-03 11:18:29.833 [rank:4] [train], epoch: 33/50, iter: 300/834, loss: 0.28549, lr: 0.382898, top1: 0.67703, throughput: 312.90 | 2022-04-03 11:18:29.837 [rank:6] [train], epoch: 33/50, iter: 300/834, loss: 0.28701, lr: 0.382898, top1: 0.67516, throughput: 312.57 | 2022-04-03 11:18:29.842 [rank:1] [train], epoch: 33/50, iter: 300/834, loss: 0.28909, lr: 0.382898, top1: 0.67422, throughput: 312.46 | 2022-04-03 11:18:29.877 [rank:3] [train], epoch: 33/50, iter: 300/834, loss: 0.28448, lr: 0.382898, top1: 0.67911, throughput: 312.48 | 2022-04-03 11:18:29.878 [rank:2] [train], epoch: 33/50, iter: 300/834, loss: 0.28844, lr: 0.382898, top1: 0.67151, throughput: 312.40 | 2022-04-03 11:18:29.884 [rank:0] [train], epoch: 33/50, iter: 300/834, loss: 0.28639, lr: 0.382898, top1: 0.67547, throughput: 312.71 | 2022-04-03 11:18:29.891 [rank:5] [train], epoch: 33/50, iter: 300/834, loss: 0.28806, lr: 0.382898, top1: 0.67250, throughput: 312.55 | 2022-04-03 11:18:29.895 [rank:5] [train], epoch: 33/50, iter: 400/834, loss: 0.28883, lr: 0.377903, top1: 0.67151, throughput: 311.93 | 2022-04-03 11:19:31.446 [rank:7] [train], epoch: 33/50, iter: 400/834, loss: 0.28854, lr: 0.377903, top1: 0.67380, throughput: 311.58 | 2022-04-03 11:19:31.454 [rank:2] [train], epoch: 33/50, iter: 400/834, loss: 0.28991, lr: 0.377903, top1: 0.66635, throughput: 311.77 | 2022-04-03 11:19:31.467 [rank:0] [train], epoch: 33/50, iter: 400/834, loss: 0.28678, lr: 0.377903, top1: 0.67109, throughput: 311.68 | 2022-04-03 11:19:31.492 [rank:3] [train], epoch: 33/50, iter: 400/834, loss: 0.28825, lr: 0.377903, top1: 0.67062, throughput: 311.60 | 2022-04-03 11:19:31.495 [rank:6] [train], epoch: 33/50, iter: 400/834, loss: 0.28853, lr: 0.377903, top1: 0.67115, throughput: 311.41 | 2022-04-03 11:19:31.496 [rank:1] [train], epoch: 33/50, iter: 400/834, loss: 0.28479, lr: 0.377903, top1: 0.67802, throughput: 311.56 | 2022-04-03 11:19:31.502 [rank:4] [train], epoch: 33/50, iter: 400/834, loss: 0.28883, lr: 0.377903, top1: 0.67135, throughput: 311.18 | 2022-04-03 11:19:31.538 [rank:2] [train], epoch: 33/50, iter: 500/834, loss: 0.28879, lr: 0.372930, top1: 0.67198, throughput: 313.21 | 2022-04-03 11:20:32.767 [rank:7] [train], epoch: 33/50, iter: 500/834, loss: 0.28766, lr: 0.372930, top1: 0.67391, throughput: 313.00 | 2022-04-03 11:20:32.797 [rank:0] [train], epoch: 33/50, iter: 500/834, loss: 0.29082, lr: 0.372930, top1: 0.67042, throughput: 313.19 | 2022-04-03 11:20:32.797 [rank:5] [train], epoch: 33/50, iter: 500/834, loss: 0.28846, lr: 0.372930, top1: 0.66901, throughput: 312.95 | 2022-04-03 11:20:32.798 [rank:1] [train], epoch: 33/50, iter: 500/834, loss: 0.28911, lr: 0.372930, top1: 0.67344, throughput: 313.20 | 2022-04-03 11:20:32.804 [rank:6] [train], epoch: 33/50, iter: 500/834, loss: 0.28745, lr: 0.372930, top1: 0.67578, throughput: 313.16 | 2022-04-03 11:20:32.806 [rank:3] [train], epoch: 33/50, iter: 500/834, loss: 0.28922, lr: 0.372930, top1: 0.67375, throughput: 313.02 | 2022-04-03 11:20:32.833 [rank:4] [train], epoch: 33/50, iter: 500/834, loss: 0.28988, lr: 0.372930, top1: 0.67052, throughput: 313.59 | 2022-04-03 11:20:32.765 [rank:7] [train], epoch: 33/50, iter: 600/834, loss: 0.28732, lr: 0.367980, top1: 0.67469, throughput: 312.68 | 2022-04-03 11:21:34.202 [rank:6] [train], epoch: 33/50, iter: 600/834, loss: 0.28920, lr: 0.367980, top1: 0.67104, throughput: 312.69 | 2022-04-03 11:21:34.209 [rank:2] [train], epoch: 33/50, iter: 600/834, loss: 0.28642, lr: 0.367980, top1: 0.67432, throughput: 312.40 | 2022-04-03 11:21:34.226 [rank:3] [train], epoch: 33/50, iter: 600/834, loss: 0.29042, lr: 0.367980, top1: 0.66776, throughput: 312.64 | 2022-04-03 11:21:34.245 [rank:4] [train], epoch: 33/50, iter: 600/834, loss: 0.28721, lr: 0.367980, top1: 0.67630, throughput: 312.28 | 2022-04-03 11:21:34.248 [rank:1] [train], epoch: 33/50, iter: 600/834, loss: 0.28456, lr: 0.367980, top1: 0.68063, throughput: 312.38 | 2022-04-03 11:21:34.267 [rank:5] [train], epoch: 33/50, iter: 600/834, loss: 0.28873, lr: 0.367980, top1: 0.66938, throughput: 312.34 | 2022-04-03 11:21:34.270 [rank:0] [train], epoch: 33/50, iter: 600/834, loss: 0.28548, lr: 0.367980, top1: 0.67823, throughput: 312.21 | 2022-04-03 11:21:34.294 [rank:5] [train], epoch: 33/50, iter: 700/834, loss: 0.28949, lr: 0.363052, top1: 0.66823, throughput: 312.64 | 2022-04-03 11:22:35.683 [rank:0] [train], epoch: 33/50, iter: 700/834, loss: 0.28855, lr: 0.363052, top1: 0.67245, throughput: 312.68 | 2022-04-03 11:22:35.699 [rank:6] [train], epoch: 33/50, iter: 700/834, loss: 0.29018, lr: 0.363052, top1: 0.66641, throughput: 312.13 | 2022-04-03 11:22:35.721 [rank:3] [train], epoch: 33/50, iter: 700/834, loss: 0.28877, lr: 0.363052, top1: 0.67042, throughput: 312.28 | 2022-04-03 11:22:35.728 [rank:2] [train], epoch: 33/50, iter: 700/834, loss: 0.29069, lr: 0.363052, top1: 0.66594, throughput: 312.08 | 2022-04-03 11:22:35.750 [rank:4] [train], epoch: 33/50, iter: 700/834, loss: 0.28982, lr: 0.363052, top1: 0.66755, throughput: 312.17 | 2022-04-03 11:22:35.753 [rank:1] [train], epoch: 33/50, iter: 700/834, loss: 0.29133, lr: 0.363052, top1: 0.66448, throughput: 312.20 | 2022-04-03 11:22:35.766 [rank:7] [train], epoch: 33/50, iter: 700/834, loss: 0.29006, lr: 0.363052, top1: 0.66682, throughput: 311.79 | 2022-04-03 11:22:35.781 [rank:7] [train], epoch: 33/50, iter: 800/834, loss: 0.28955, lr: 0.358147, top1: 0.66740, throughput: 312.44 | 2022-04-03 11:23:37.234 [rank:2] [train], epoch: 33/50, iter: 800/834, loss: 0.29026, lr: 0.358147, top1: 0.66906, throughput: 312.11 | 2022-04-03 11:23:37.267 [rank:4] [train], epoch: 33/50, iter: 800/834, loss: 0.28690, lr: 0.358147, top1: 0.67339, throughput: 312.09 | 2022-04-03 11:23:37.273 [rank:5] [train], epoch: 33/50, iter: 800/834, loss: 0.28863, lr: 0.358147, top1: 0.67365, throughput: 311.71 | 2022-04-03 11:23:37.280 [rank:1] [train], epoch: 33/50, iter: 800/834, loss: 0.29025, lr: 0.358147, top1: 0.66901, throughput: 312.12 | 2022-04-03 11:23:37.281 [rank:3] [train], epoch: 33/50, iter: 800/834, loss: 0.28896, lr: 0.358147, top1: 0.67229, throughput: 311.89 | 2022-04-03 11:23:37.288 [rank:0] [train], epoch: 33/50, iter: 800/834, loss: 0.28758, lr: 0.358147, top1: 0.67245, throughput: 311.72 | 2022-04-03 11:23:37.293 [rank:6] [train], epoch: 33/50, iter: 800/834, loss: 0.28699, lr: 0.358147, top1: 0.67411, throughput: 311.84 | 2022-04-03 11:23:37.291 [rank:6] [train], epoch: 33/50, iter: 834/834, loss: 0.28493, lr: 0.356485, top1: 0.67586, throughput: 313.80 | 2022-04-03 11:23:58.095 [rank:1] [train], epoch: 33/50, iter: 834/834, loss: 0.29060, lr: 0.356485, top1: 0.67693, throughput: 313.58 | 2022-04-03 11:23:58.099 [rank:2] [train], epoch: 33/50, iter: 834/834, loss: 0.29267, lr: 0.356485, top1: 0.67126, throughput: 313.36 | 2022-04-03 11:23:58.100 [rank:4] [train], epoch: 33/50, iter: 834/834, loss: 0.29044, lr: 0.356485, top1: 0.66896, throughput: 313.38 | 2022-04-03 11:23:58.104 [rank:7] [train], epoch: 33/50, iter: 834/834, loss: 0.28715, lr: 0.356485, top1: 0.67295, throughput: 312.79 | 2022-04-03 11:23:58.104 [rank:3] [train], epoch: 33/50, iter: 834/834, loss: 0.28710, lr: 0.356485, top1: 0.67678, throughput: 313.61 | 2022-04-03 11:23:58.104 [rank:0] [train], epoch: 33/50, iter: 834/834, loss: 0.29020, lr: 0.356485, top1: 0.66636, throughput: 313.53 | 2022-04-03 11:23:58.114 [rank:5] [train], epoch: 33/50, iter: 834/834, loss: 0.28646, lr: 0.356485, top1: 0.67157, throughput: 312.81 | 2022-04-03 11:23:58.149 [rank:0] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.69424, throughput: 481.43 | 2022-04-03 11:24:11.096 [rank:1] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68544, throughput: 480.72 | 2022-04-03 11:24:11.100 [rank:2] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68176, throughput: 480.30 | 2022-04-03 11:24:11.112 [rank:5] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68048, throughput: 481.96 | 2022-04-03 11:24:11.117 [rank:7] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68752, throughput: 480.27 | 2022-04-03 11:24:11.117 [rank:3] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68336, throughput: 480.14 | 2022-04-03 11:24:11.121 [rank:6] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.69056, throughput: 479.21 | 2022-04-03 11:24:11.137 [rank:4] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68624, throughput: 479.50 | 2022-04-03 11:24:11.138 [rank:3] [train], epoch: 34/50, iter: 100/834, loss: 0.28318, lr: 0.351612, top1: 0.68016, throughput: 314.38 | 2022-04-03 11:25:12.194 [rank:5] [train], epoch: 34/50, iter: 100/834, loss: 0.28342, lr: 0.351612, top1: 0.68479, throughput: 314.31 | 2022-04-03 11:25:12.204 [rank:1] [train], epoch: 34/50, iter: 100/834, loss: 0.28478, lr: 0.351612, top1: 0.68010, throughput: 314.05 | 2022-04-03 11:25:12.236 [rank:4] [train], epoch: 34/50, iter: 100/834, loss: 0.28397, lr: 0.351612, top1: 0.67922, throughput: 314.19 | 2022-04-03 11:25:12.247 [rank:0] [train], epoch: 34/50, iter: 100/834, loss: 0.28258, lr: 0.351612, top1: 0.68604, throughput: 313.97 | 2022-04-03 11:25:12.248 [rank:2] [train], epoch: 34/50, iter: 100/834, loss: 0.28165, lr: 0.351612, top1: 0.68193, throughput: 314.04 | 2022-04-03 11:25:12.251 [rank:7] [train], epoch: 34/50, iter: 100/834, loss: 0.28316, lr: 0.351612, top1: 0.67839, throughput: 314.07 | 2022-04-03 11:25:12.250 [rank:6] [train], epoch: 34/50, iter: 100/834, loss: 0.28442, lr: 0.351612, top1: 0.67896, throughput: 314.10 | 2022-04-03 11:25:12.263 [rank:7] [train], epoch: 34/50, iter: 200/834, loss: 0.28124, lr: 0.346762, top1: 0.68615, throughput: 313.83 | 2022-04-03 11:26:13.430 [rank:2] [train], epoch: 34/50, iter: 200/834, loss: 0.28665, lr: 0.346762, top1: 0.67620, throughput: 313.82 | 2022-04-03 11:26:13.433 [rank:5] [train], epoch: 34/50, iter: 200/834, loss: 0.28406, lr: 0.346762, top1: 0.68260, throughput: 313.52 | 2022-04-03 11:26:13.445 [rank:1] [train], epoch: 34/50, iter: 200/834, loss: 0.28386, lr: 0.346762, top1: 0.67740, throughput: 313.61 | 2022-04-03 11:26:13.459 [rank:3] [train], epoch: 34/50, iter: 200/834, loss: 0.28312, lr: 0.346762, top1: 0.68500, throughput: 313.39 | 2022-04-03 11:26:13.459 [rank:6] [train], epoch: 34/50, iter: 200/834, loss: 0.28369, lr: 0.346762, top1: 0.68089, throughput: 313.56 | 2022-04-03 11:26:13.496 [rank:0] [train], epoch: 34/50, iter: 200/834, loss: 0.28210, lr: 0.346762, top1: 0.68302, throughput: 313.38 | 2022-04-03 11:26:13.516 [rank:4] [train], epoch: 34/50, iter: 200/834, loss: 0.28241, lr: 0.346762, top1: 0.68354, throughput: 313.27 | 2022-04-03 11:26:13.536 [rank:2] [train], epoch: 34/50, iter: 300/834, loss: 0.28547, lr: 0.341936, top1: 0.67854, throughput: 313.50 | 2022-04-03 11:27:14.677 [rank:1] [train], epoch: 34/50, iter: 300/834, loss: 0.28347, lr: 0.341936, top1: 0.68380, throughput: 313.63 | 2022-04-03 11:27:14.678 [rank:3] [train], epoch: 34/50, iter: 300/834, loss: 0.28615, lr: 0.341936, top1: 0.67672, throughput: 313.63 | 2022-04-03 11:27:14.678 [rank:7] [train], epoch: 34/50, iter: 300/834, loss: 0.28276, lr: 0.341936, top1: 0.68438, throughput: 313.29 | 2022-04-03 11:27:14.715 [rank:6] [train], epoch: 34/50, iter: 300/834, loss: 0.28656, lr: 0.341936, top1: 0.67417, throughput: 313.59 | 2022-04-03 11:27:14.722 [rank:0] [train], epoch: 34/50, iter: 300/834, loss: 0.28276, lr: 0.341936, top1: 0.68135, throughput: 313.60 | 2022-04-03 11:27:14.740 [rank:5] [train], epoch: 34/50, iter: 300/834, loss: 0.28482, lr: 0.341936, top1: 0.68437, throughput: 313.18 | 2022-04-03 11:27:14.752 [rank:4] [train], epoch: 34/50, iter: 300/834, loss: 0.28544, lr: 0.341936, top1: 0.67328, throughput: 314.09 | 2022-04-03 11:27:14.665 [rank:6] [train], epoch: 34/50, iter: 400/834, loss: 0.28415, lr: 0.337134, top1: 0.67708, throughput: 311.36 | 2022-04-03 11:28:16.387 [rank:1] [train], epoch: 34/50, iter: 400/834, loss: 0.28613, lr: 0.337134, top1: 0.67646, throughput: 311.06 | 2022-04-03 11:28:16.402 [rank:5] [train], epoch: 34/50, iter: 400/834, loss: 0.28571, lr: 0.337134, top1: 0.67604, throughput: 311.39 | 2022-04-03 11:28:16.410 [rank:0] [train], epoch: 34/50, iter: 400/834, loss: 0.28425, lr: 0.337134, top1: 0.68281, throughput: 311.25 | 2022-04-03 11:28:16.426 [rank:2] [train], epoch: 34/50, iter: 400/834, loss: 0.28666, lr: 0.337134, top1: 0.67734, throughput: 310.91 | 2022-04-03 11:28:16.432 [rank:4] [train], epoch: 34/50, iter: 400/834, loss: 0.28697, lr: 0.337134, top1: 0.67646, throughput: 310.83 | 2022-04-03 11:28:16.436 [rank:3] [train], epoch: 34/50, iter: 400/834, loss: 0.28314, lr: 0.337134, top1: 0.68458, throughput: 310.86 | 2022-04-03 11:28:16.441 [rank:7] [train], epoch: 34/50, iter: 400/834, loss: 0.28505, lr: 0.337134, top1: 0.67766, throughput: 310.80 | 2022-04-03 11:28:16.491 [rank:6] [train], epoch: 34/50, iter: 500/834, loss: 0.28429, lr: 0.332357, top1: 0.67854, throughput: 311.39 | 2022-04-03 11:29:18.047 [rank:4] [train], epoch: 34/50, iter: 500/834, loss: 0.28519, lr: 0.332357, top1: 0.67724, throughput: 311.56 | 2022-04-03 11:29:18.061 [rank:2] [train], epoch: 34/50, iter: 500/834, loss: 0.28483, lr: 0.332357, top1: 0.68042, throughput: 311.47 | 2022-04-03 11:29:18.074 [rank:0] [train], epoch: 34/50, iter: 500/834, loss: 0.28442, lr: 0.332357, top1: 0.67901, throughput: 311.82 | 2022-04-03 11:29:18.001 [rank:7] [train], epoch: 34/50, iter: 500/834, loss: 0.28411, lr: 0.332357, top1: 0.67719, throughput: 311.69 | 2022-04-03 11:29:18.090 [rank:3] [train], epoch: 34/50, iter: 500/834, loss: 0.28145, lr: 0.332357, top1: 0.68297, throughput: 311.42 | 2022-04-03 11:29:18.095 [rank:5] [train], epoch: 34/50, iter: 500/834, loss: 0.28142, lr: 0.332357, top1: 0.68406, throughput: 311.26 | 2022-04-03 11:29:18.096 [rank:1] [train], epoch: 34/50, iter: 500/834, loss: 0.28564, lr: 0.332357, top1: 0.67625, throughput: 311.16 | 2022-04-03 11:29:18.106 [rank:5] [train], epoch: 34/50, iter: 600/834, loss: 0.28470, lr: 0.327604, top1: 0.67823, throughput: 313.48 | 2022-04-03 11:30:19.343 [rank:3] [train], epoch: 34/50, iter: 600/834, loss: 0.28434, lr: 0.327604, top1: 0.68047, throughput: 313.32 | 2022-04-03 11:30:19.373 [rank:4] [train], epoch: 34/50, iter: 600/834, loss: 0.28451, lr: 0.327604, top1: 0.68047, throughput: 313.14 | 2022-04-03 11:30:19.374 [rank:0] [train], epoch: 34/50, iter: 600/834, loss: 0.28584, lr: 0.327604, top1: 0.67693, throughput: 312.84 | 2022-04-03 11:30:19.375 [rank:6] [train], epoch: 34/50, iter: 600/834, loss: 0.28493, lr: 0.327604, top1: 0.67937, throughput: 313.02 | 2022-04-03 11:30:19.384 [rank:2] [train], epoch: 34/50, iter: 600/834, loss: 0.28524, lr: 0.327604, top1: 0.68026, throughput: 313.15 | 2022-04-03 11:30:19.388 [rank:1] [train], epoch: 34/50, iter: 600/834, loss: 0.28459, lr: 0.327604, top1: 0.68062, throughput: 313.25 | 2022-04-03 11:30:19.398 [rank:7] [train], epoch: 34/50, iter: 600/834, loss: 0.28572, lr: 0.327604, top1: 0.67786, throughput: 313.17 | 2022-04-03 11:30:19.400 [rank:3] [train], epoch: 34/50, iter: 700/834, loss: 0.28264, lr: 0.322876, top1: 0.68255, throughput: 312.75 | 2022-04-03 11:31:20.764 [rank:7] [train], epoch: 34/50, iter: 700/834, loss: 0.28314, lr: 0.322876, top1: 0.68286, throughput: 312.86 | 2022-04-03 11:31:20.768 [rank:2] [train], epoch: 34/50, iter: 700/834, loss: 0.28405, lr: 0.322876, top1: 0.68193, throughput: 312.75 | 2022-04-03 11:31:20.779 [rank:6] [train], epoch: 34/50, iter: 700/834, loss: 0.28510, lr: 0.322876, top1: 0.67984, throughput: 312.70 | 2022-04-03 11:31:20.784 [rank:1] [train], epoch: 34/50, iter: 700/834, loss: 0.28419, lr: 0.322876, top1: 0.68021, throughput: 312.76 | 2022-04-03 11:31:20.786 [rank:0] [train], epoch: 34/50, iter: 700/834, loss: 0.28359, lr: 0.322876, top1: 0.68208, throughput: 312.50 | 2022-04-03 11:31:20.815 [rank:5] [train], epoch: 34/50, iter: 700/834, loss: 0.28379, lr: 0.322876, top1: 0.68177, throughput: 312.31 | 2022-04-03 11:31:20.820 [rank:4] [train], epoch: 34/50, iter: 700/834, loss: 0.28599, lr: 0.322876, top1: 0.67760, throughput: 312.47 | 2022-04-03 11:31:20.821 [rank:0] [train], epoch: 34/50, iter: 800/834, loss: 0.28534, lr: 0.318174, top1: 0.67995, throughput: 311.95 | 2022-04-03 11:32:22.363 [rank:5] [train], epoch: 34/50, iter: 800/834, loss: 0.28363, lr: 0.318174, top1: 0.68052, throughput: 311.97 | 2022-04-03 11:32:22.363 [rank:1] [train], epoch: 34/50, iter: 800/834, loss: 0.28357, lr: 0.318174, top1: 0.68188, throughput: 311.74 | 2022-04-03 11:32:22.376 [rank:6] [train], epoch: 34/50, iter: 800/834, loss: 0.28536, lr: 0.318174, top1: 0.67615, throughput: 311.70 | 2022-04-03 11:32:22.383 [rank:7] [train], epoch: 34/50, iter: 800/834, loss: 0.28554, lr: 0.318174, top1: 0.67542, throughput: 311.56 | 2022-04-03 11:32:22.393 [rank:2] [train], epoch: 34/50, iter: 800/834, loss: 0.28400, lr: 0.318174, top1: 0.68073, throughput: 311.40 | 2022-04-03 11:32:22.437 [rank:3] [train], epoch: 34/50, iter: 800/834, loss: 0.28256, lr: 0.318174, top1: 0.68313, throughput: 311.29 | 2022-04-03 11:32:22.442 [rank:4] [train], epoch: 34/50, iter: 800/834, loss: 0.28476, lr: 0.318174, top1: 0.67703, throughput: 312.06 | 2022-04-03 11:32:22.348 [rank:6] [train], epoch: 34/50, iter: 834/834, loss: 0.28269, lr: 0.316581, top1: 0.67907, throughput: 311.43 | 2022-04-03 11:32:43.344 [rank:4] [train], epoch: 34/50, iter: 834/834, loss: 0.28262, lr: 0.316581, top1: 0.68352, throughput: 310.80 | 2022-04-03 11:32:43.352 [rank:2] [train], epoch: 34/50, iter: 834/834, loss: 0.28440, lr: 0.316581, top1: 0.67034, throughput: 312.09 | 2022-04-03 11:32:43.354 [rank:7] [train], epoch: 34/50, iter: 834/834, loss: 0.28272, lr: 0.316581, top1: 0.67999, throughput: 311.44 | 2022-04-03 11:32:43.354 [rank:0] [train], epoch: 34/50, iter: 834/834, loss: 0.29017, lr: 0.316581, top1: 0.66422, throughput: 310.94 | 2022-04-03 11:32:43.357 [rank:1] [train], epoch: 34/50, iter: 834/834, loss: 0.28377, lr: 0.316581, top1: 0.67892, throughput: 311.02 | 2022-04-03 11:32:43.365 [rank:3] [train], epoch: 34/50, iter: 834/834, loss: 0.28555, lr: 0.316581, top1: 0.67785, throughput: 311.81 | 2022-04-03 11:32:43.378 [rank:5] [train], epoch: 34/50, iter: 834/834, loss: 0.28071, lr: 0.316581, top1: 0.68995, throughput: 311.21 | 2022-04-03 11:32:43.339 [rank:0] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.69408, throughput: 486.39 | 2022-04-03 11:32:56.207 [rank:1] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68672, throughput: 486.66 | 2022-04-03 11:32:56.207 [rank:2] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68112, throughput: 485.75 | 2022-04-03 11:32:56.220 [rank:5] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.67680, throughput: 485.09 | 2022-04-03 11:32:56.224 [rank:7] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.69152, throughput: 485.26 | 2022-04-03 11:32:56.234 [rank:6] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68864, throughput: 484.59 | 2022-04-03 11:32:56.242 [rank:3] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.67984, throughput: 485.78 | 2022-04-03 11:32:56.244 [rank:4] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68880, throughput: 484.73 | 2022-04-03 11:32:56.245 [rank:5] [train], epoch: 35/50, iter: 100/834, loss: 0.28033, lr: 0.311913, top1: 0.68917, throughput: 314.03 | 2022-04-03 11:33:57.364 [rank:0] [train], epoch: 35/50, iter: 100/834, loss: 0.27689, lr: 0.311913, top1: 0.69646, throughput: 313.74 | 2022-04-03 11:33:57.405 [rank:6] [train], epoch: 35/50, iter: 100/834, loss: 0.27616, lr: 0.311913, top1: 0.69745, throughput: 313.90 | 2022-04-03 11:33:57.408 [rank:1] [train], epoch: 35/50, iter: 100/834, loss: 0.27662, lr: 0.311913, top1: 0.69625, throughput: 313.71 | 2022-04-03 11:33:57.411 [rank:7] [train], epoch: 35/50, iter: 100/834, loss: 0.27937, lr: 0.311913, top1: 0.68932, throughput: 313.82 | 2022-04-03 11:33:57.416 [rank:4] [train], epoch: 35/50, iter: 100/834, loss: 0.27788, lr: 0.311913, top1: 0.69187, throughput: 313.87 | 2022-04-03 11:33:57.417 [rank:3] [train], epoch: 35/50, iter: 100/834, loss: 0.27891, lr: 0.311913, top1: 0.69339, throughput: 313.86 | 2022-04-03 11:33:57.418 [rank:2] [train], epoch: 35/50, iter: 100/834, loss: 0.28178, lr: 0.311913, top1: 0.68417, throughput: 314.04 | 2022-04-03 11:33:57.358 [rank:5] [train], epoch: 35/50, iter: 200/834, loss: 0.27919, lr: 0.307271, top1: 0.68922, throughput: 311.97 | 2022-04-03 11:34:58.908 [rank:2] [train], epoch: 35/50, iter: 200/834, loss: 0.27908, lr: 0.307271, top1: 0.68901, throughput: 311.85 | 2022-04-03 11:34:58.926 [rank:7] [train], epoch: 35/50, iter: 200/834, loss: 0.28097, lr: 0.307271, top1: 0.68578, throughput: 312.14 | 2022-04-03 11:34:58.926 [rank:3] [train], epoch: 35/50, iter: 200/834, loss: 0.28067, lr: 0.307271, top1: 0.68792, throughput: 312.03 | 2022-04-03 11:34:58.951 [rank:1] [train], epoch: 35/50, iter: 200/834, loss: 0.28075, lr: 0.307271, top1: 0.68854, throughput: 311.97 | 2022-04-03 11:34:58.956 [rank:4] [train], epoch: 35/50, iter: 200/834, loss: 0.27826, lr: 0.307271, top1: 0.69422, throughput: 311.97 | 2022-04-03 11:34:58.962 [rank:6] [train], epoch: 35/50, iter: 200/834, loss: 0.27753, lr: 0.307271, top1: 0.69245, throughput: 311.88 | 2022-04-03 11:34:58.971 [rank:0] [train], epoch: 35/50, iter: 200/834, loss: 0.28176, lr: 0.307271, top1: 0.68323, throughput: 311.72 | 2022-04-03 11:34:58.998 [rank:3] [train], epoch: 35/50, iter: 300/834, loss: 0.28028, lr: 0.302655, top1: 0.68641, throughput: 313.63 | 2022-04-03 11:36:00.170 [rank:2] [train], epoch: 35/50, iter: 300/834, loss: 0.27947, lr: 0.302655, top1: 0.68906, throughput: 313.39 | 2022-04-03 11:36:00.191 [rank:1] [train], epoch: 35/50, iter: 300/834, loss: 0.28331, lr: 0.302655, top1: 0.67932, throughput: 313.54 | 2022-04-03 11:36:00.191 [rank:5] [train], epoch: 35/50, iter: 300/834, loss: 0.28081, lr: 0.302655, top1: 0.68568, throughput: 313.16 | 2022-04-03 11:36:00.219 [rank:4] [train], epoch: 35/50, iter: 300/834, loss: 0.28008, lr: 0.302655, top1: 0.68760, throughput: 313.41 | 2022-04-03 11:36:00.224 [rank:6] [train], epoch: 35/50, iter: 300/834, loss: 0.27764, lr: 0.302655, top1: 0.69312, throughput: 313.44 | 2022-04-03 11:36:00.226 [rank:0] [train], epoch: 35/50, iter: 300/834, loss: 0.28124, lr: 0.302655, top1: 0.68552, throughput: 313.58 | 2022-04-03 11:36:00.227 [rank:7] [train], epoch: 35/50, iter: 300/834, loss: 0.28139, lr: 0.302655, top1: 0.68307, throughput: 313.07 | 2022-04-03 11:36:00.253 [rank:6] [train], epoch: 35/50, iter: 400/834, loss: 0.27860, lr: 0.298065, top1: 0.69349, throughput: 314.34 | 2022-04-03 11:37:01.306 [rank:4] [train], epoch: 35/50, iter: 400/834, loss: 0.28107, lr: 0.298065, top1: 0.68859, throughput: 314.28 | 2022-04-03 11:37:01.317 [rank:3] [train], epoch: 35/50, iter: 400/834, loss: 0.28202, lr: 0.298065, top1: 0.68349, throughput: 313.82 | 2022-04-03 11:37:01.352 [rank:5] [train], epoch: 35/50, iter: 400/834, loss: 0.28123, lr: 0.298065, top1: 0.68708, throughput: 314.04 | 2022-04-03 11:37:01.357 [rank:2] [train], epoch: 35/50, iter: 400/834, loss: 0.28230, lr: 0.298065, top1: 0.68521, throughput: 313.89 | 2022-04-03 11:37:01.359 [rank:1] [train], epoch: 35/50, iter: 400/834, loss: 0.28328, lr: 0.298065, top1: 0.68151, throughput: 313.88 | 2022-04-03 11:37:01.361 [rank:0] [train], epoch: 35/50, iter: 400/834, loss: 0.28280, lr: 0.298065, top1: 0.68141, throughput: 314.06 | 2022-04-03 11:37:01.362 [rank:7] [train], epoch: 35/50, iter: 400/834, loss: 0.27953, lr: 0.298065, top1: 0.68812, throughput: 314.12 | 2022-04-03 11:37:01.377 [rank:1] [train], epoch: 35/50, iter: 500/834, loss: 0.28389, lr: 0.293502, top1: 0.67745, throughput: 312.67 | 2022-04-03 11:38:02.768 [rank:2] [train], epoch: 35/50, iter: 500/834, loss: 0.28140, lr: 0.293502, top1: 0.68521, throughput: 312.64 | 2022-04-03 11:38:02.772 [rank:6] [train], epoch: 35/50, iter: 500/834, loss: 0.28195, lr: 0.293502, top1: 0.68365, throughput: 312.36 | 2022-04-03 11:38:02.774 [rank:3] [train], epoch: 35/50, iter: 500/834, loss: 0.27918, lr: 0.293502, top1: 0.68807, throughput: 312.52 | 2022-04-03 11:38:02.789 [rank:5] [train], epoch: 35/50, iter: 500/834, loss: 0.28101, lr: 0.293502, top1: 0.68646, throughput: 312.54 | 2022-04-03 11:38:02.788 [rank:7] [train], epoch: 35/50, iter: 500/834, loss: 0.27965, lr: 0.293502, top1: 0.69094, throughput: 312.63 | 2022-04-03 11:38:02.791 [rank:0] [train], epoch: 35/50, iter: 500/834, loss: 0.27927, lr: 0.293502, top1: 0.68911, throughput: 312.52 | 2022-04-03 11:38:02.798 [rank:4] [train], epoch: 35/50, iter: 500/834, loss: 0.28212, lr: 0.293502, top1: 0.68187, throughput: 312.55 | 2022-04-03 11:38:02.747 [rank:2] [train], epoch: 35/50, iter: 600/834, loss: 0.28177, lr: 0.288966, top1: 0.68276, throughput: 311.62 | 2022-04-03 11:39:04.385 [rank:1] [train], epoch: 35/50, iter: 600/834, loss: 0.27953, lr: 0.288966, top1: 0.69177, throughput: 311.51 | 2022-04-03 11:39:04.404 [rank:0] [train], epoch: 35/50, iter: 600/834, loss: 0.28074, lr: 0.288966, top1: 0.68802, throughput: 311.64 | 2022-04-03 11:39:04.406 [rank:6] [train], epoch: 35/50, iter: 600/834, loss: 0.27737, lr: 0.288966, top1: 0.69281, throughput: 311.45 | 2022-04-03 11:39:04.422 [rank:3] [train], epoch: 35/50, iter: 600/834, loss: 0.28016, lr: 0.288966, top1: 0.68760, throughput: 311.51 | 2022-04-03 11:39:04.424 [rank:5] [train], epoch: 35/50, iter: 600/834, loss: 0.28041, lr: 0.288966, top1: 0.68901, throughput: 311.48 | 2022-04-03 11:39:04.430 [rank:4] [train], epoch: 35/50, iter: 600/834, loss: 0.27949, lr: 0.288966, top1: 0.68620, throughput: 311.25 | 2022-04-03 11:39:04.434 [rank:7] [train], epoch: 35/50, iter: 600/834, loss: 0.28075, lr: 0.288966, top1: 0.68865, throughput: 311.30 | 2022-04-03 11:39:04.467 [rank:1] [train], epoch: 35/50, iter: 700/834, loss: 0.27846, lr: 0.284457, top1: 0.69271, throughput: 313.65 | 2022-04-03 11:40:05.620 [rank:5] [train], epoch: 35/50, iter: 700/834, loss: 0.27845, lr: 0.284457, top1: 0.69229, throughput: 313.70 | 2022-04-03 11:40:05.636 [rank:0] [train], epoch: 35/50, iter: 700/834, loss: 0.27945, lr: 0.284457, top1: 0.68781, throughput: 313.57 | 2022-04-03 11:40:05.637 [rank:2] [train], epoch: 35/50, iter: 700/834, loss: 0.27962, lr: 0.284457, top1: 0.68922, throughput: 313.45 | 2022-04-03 11:40:05.638 [rank:6] [train], epoch: 35/50, iter: 700/834, loss: 0.28028, lr: 0.284457, top1: 0.68547, throughput: 313.56 | 2022-04-03 11:40:05.654 [rank:3] [train], epoch: 35/50, iter: 700/834, loss: 0.28189, lr: 0.284457, top1: 0.68646, throughput: 313.48 | 2022-04-03 11:40:05.672 [rank:4] [train], epoch: 35/50, iter: 700/834, loss: 0.27965, lr: 0.284457, top1: 0.68875, throughput: 313.94 | 2022-04-03 11:40:05.592 [rank:7] [train], epoch: 35/50, iter: 700/834, loss: 0.28054, lr: 0.284457, top1: 0.69026, throughput: 313.59 | 2022-04-03 11:40:05.693 [rank:0] [train], epoch: 35/50, iter: 800/834, loss: 0.28003, lr: 0.279976, top1: 0.68953, throughput: 311.89 | 2022-04-03 11:41:07.197 [rank:5] [train], epoch: 35/50, iter: 800/834, loss: 0.28036, lr: 0.279976, top1: 0.68870, throughput: 311.86 | 2022-04-03 11:41:07.203 [rank:3] [train], epoch: 35/50, iter: 800/834, loss: 0.28198, lr: 0.279976, top1: 0.68297, throughput: 312.01 | 2022-04-03 11:41:07.210 [rank:2] [train], epoch: 35/50, iter: 800/834, loss: 0.28024, lr: 0.279976, top1: 0.68937, throughput: 311.81 | 2022-04-03 11:41:07.214 [rank:4] [train], epoch: 35/50, iter: 800/834, loss: 0.28026, lr: 0.279976, top1: 0.68870, throughput: 311.51 | 2022-04-03 11:41:07.228 [rank:6] [train], epoch: 35/50, iter: 800/834, loss: 0.28212, lr: 0.279976, top1: 0.68380, throughput: 311.73 | 2022-04-03 11:41:07.246 [rank:7] [train], epoch: 35/50, iter: 800/834, loss: 0.28078, lr: 0.279976, top1: 0.68755, throughput: 311.92 | 2022-04-03 11:41:07.247 [rank:1] [train], epoch: 35/50, iter: 800/834, loss: 0.27879, lr: 0.279976, top1: 0.69172, throughput: 311.50 | 2022-04-03 11:41:07.257 [rank:5] [train], epoch: 35/50, iter: 834/834, loss: 0.27907, lr: 0.278458, top1: 0.68627, throughput: 312.27 | 2022-04-03 11:41:28.108 [rank:6] [train], epoch: 35/50, iter: 834/834, loss: 0.28155, lr: 0.278458, top1: 0.68398, throughput: 312.90 | 2022-04-03 11:41:28.109 [rank:4] [train], epoch: 35/50, iter: 834/834, loss: 0.28106, lr: 0.278458, top1: 0.67754, throughput: 312.58 | 2022-04-03 11:41:28.113 [rank:0] [train], epoch: 35/50, iter: 834/834, loss: 0.28206, lr: 0.278458, top1: 0.67892, throughput: 312.05 | 2022-04-03 11:41:28.117 [rank:1] [train], epoch: 35/50, iter: 834/834, loss: 0.27834, lr: 0.278458, top1: 0.68796, throughput: 312.88 | 2022-04-03 11:41:28.121 [rank:7] [train], epoch: 35/50, iter: 834/834, loss: 0.28362, lr: 0.278458, top1: 0.68352, throughput: 312.71 | 2022-04-03 11:41:28.122 [rank:2] [train], epoch: 35/50, iter: 834/834, loss: 0.28556, lr: 0.278458, top1: 0.67662, throughput: 312.12 | 2022-04-03 11:41:28.129 [rank:3] [train], epoch: 35/50, iter: 834/834, loss: 0.28313, lr: 0.278458, top1: 0.67923, throughput: 312.05 | 2022-04-03 11:41:28.129 [rank:0] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.69328, throughput: 495.87 | 2022-04-03 11:41:40.721 [rank:1] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.69184, throughput: 495.90 | 2022-04-03 11:41:40.724 [rank:2] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.68688, throughput: 496.10 | 2022-04-03 11:41:40.727 [rank:5] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.67392, throughput: 494.79 | 2022-04-03 11:41:40.739 [rank:4] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.67984, throughput: 494.51 | 2022-04-03 11:41:40.751 [rank:7] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.69088, throughput: 494.86 | 2022-04-03 11:41:40.752 [rank:6] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.68832, throughput: 493.94 | 2022-04-03 11:41:40.762 [rank:3] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.67904, throughput: 494.67 | 2022-04-03 11:41:40.764 [rank:1] [train], epoch: 36/50, iter: 100/834, loss: 0.27558, lr: 0.274014, top1: 0.69448, throughput: 311.74 | 2022-04-03 11:42:42.314 [rank:4] [train], epoch: 36/50, iter: 100/834, loss: 0.27048, lr: 0.274014, top1: 0.70547, throughput: 311.88 | 2022-04-03 11:42:42.314 [rank:6] [train], epoch: 36/50, iter: 100/834, loss: 0.27353, lr: 0.274014, top1: 0.69937, throughput: 311.88 | 2022-04-03 11:42:42.325 [rank:7] [train], epoch: 36/50, iter: 100/834, loss: 0.27359, lr: 0.274014, top1: 0.70146, throughput: 311.77 | 2022-04-03 11:42:42.335 [rank:0] [train], epoch: 36/50, iter: 100/834, loss: 0.27341, lr: 0.274014, top1: 0.70484, throughput: 311.60 | 2022-04-03 11:42:42.340 [rank:3] [train], epoch: 36/50, iter: 100/834, loss: 0.27670, lr: 0.274014, top1: 0.69406, throughput: 311.80 | 2022-04-03 11:42:42.341 [rank:5] [train], epoch: 36/50, iter: 100/834, loss: 0.27438, lr: 0.274014, top1: 0.70104, throughput: 311.62 | 2022-04-03 11:42:42.353 [rank:2] [train], epoch: 36/50, iter: 100/834, loss: 0.27400, lr: 0.274014, top1: 0.70016, throughput: 311.51 | 2022-04-03 11:42:42.363 [rank:7] [train], epoch: 36/50, iter: 200/834, loss: 0.27391, lr: 0.269598, top1: 0.70161, throughput: 313.07 | 2022-04-03 11:43:43.663 [rank:5] [train], epoch: 36/50, iter: 200/834, loss: 0.27588, lr: 0.269598, top1: 0.69786, throughput: 313.13 | 2022-04-03 11:43:43.670 [rank:4] [train], epoch: 36/50, iter: 200/834, loss: 0.27393, lr: 0.269598, top1: 0.70276, throughput: 312.91 | 2022-04-03 11:43:43.674 [rank:2] [train], epoch: 36/50, iter: 200/834, loss: 0.27485, lr: 0.269598, top1: 0.69901, throughput: 313.02 | 2022-04-03 11:43:43.701 [rank:1] [train], epoch: 36/50, iter: 200/834, loss: 0.27645, lr: 0.269598, top1: 0.69375, throughput: 312.75 | 2022-04-03 11:43:43.705 [rank:3] [train], epoch: 36/50, iter: 200/834, loss: 0.27386, lr: 0.269598, top1: 0.69703, throughput: 312.88 | 2022-04-03 11:43:43.706 [rank:0] [train], epoch: 36/50, iter: 200/834, loss: 0.27407, lr: 0.269598, top1: 0.69958, throughput: 312.83 | 2022-04-03 11:43:43.716 [rank:6] [train], epoch: 36/50, iter: 200/834, loss: 0.27398, lr: 0.269598, top1: 0.69755, throughput: 312.53 | 2022-04-03 11:43:43.758 [rank:2] [train], epoch: 36/50, iter: 300/834, loss: 0.27567, lr: 0.265210, top1: 0.70005, throughput: 313.74 | 2022-04-03 11:44:44.898 [rank:0] [train], epoch: 36/50, iter: 300/834, loss: 0.27548, lr: 0.265210, top1: 0.69964, throughput: 313.79 | 2022-04-03 11:44:44.903 [rank:7] [train], epoch: 36/50, iter: 300/834, loss: 0.27842, lr: 0.265210, top1: 0.69219, throughput: 313.46 | 2022-04-03 11:44:44.915 [rank:6] [train], epoch: 36/50, iter: 300/834, loss: 0.27727, lr: 0.265210, top1: 0.69531, throughput: 313.93 | 2022-04-03 11:44:44.918 [rank:1] [train], epoch: 36/50, iter: 300/834, loss: 0.27335, lr: 0.265210, top1: 0.70021, throughput: 313.63 | 2022-04-03 11:44:44.924 [rank:3] [train], epoch: 36/50, iter: 300/834, loss: 0.27711, lr: 0.265210, top1: 0.69667, throughput: 313.56 | 2022-04-03 11:44:44.939 [rank:5] [train], epoch: 36/50, iter: 300/834, loss: 0.27649, lr: 0.265210, top1: 0.69292, throughput: 313.28 | 2022-04-03 11:44:44.957 [rank:4] [train], epoch: 36/50, iter: 300/834, loss: 0.27576, lr: 0.265210, top1: 0.69964, throughput: 313.28 | 2022-04-03 11:44:44.961 [rank:6] [train], epoch: 36/50, iter: 400/834, loss: 0.27546, lr: 0.260851, top1: 0.69844, throughput: 312.39 | 2022-04-03 11:45:46.380 [rank:1] [train], epoch: 36/50, iter: 400/834, loss: 0.27622, lr: 0.260851, top1: 0.69328, throughput: 312.34 | 2022-04-03 11:45:46.396 [rank:3] [train], epoch: 36/50, iter: 400/834, loss: 0.27600, lr: 0.260851, top1: 0.69760, throughput: 312.40 | 2022-04-03 11:45:46.398 [rank:0] [train], epoch: 36/50, iter: 400/834, loss: 0.27687, lr: 0.260851, top1: 0.69370, throughput: 312.11 | 2022-04-03 11:45:46.420 [rank:4] [train], epoch: 36/50, iter: 400/834, loss: 0.27558, lr: 0.260851, top1: 0.69943, throughput: 312.31 | 2022-04-03 11:45:46.439 [rank:5] [train], epoch: 36/50, iter: 400/834, loss: 0.27606, lr: 0.260851, top1: 0.69531, throughput: 312.23 | 2022-04-03 11:45:46.451 [rank:7] [train], epoch: 36/50, iter: 400/834, loss: 0.27434, lr: 0.260851, top1: 0.69792, throughput: 311.91 | 2022-04-03 11:45:46.471 [rank:2] [train], epoch: 36/50, iter: 400/834, loss: 0.27869, lr: 0.260851, top1: 0.69005, throughput: 312.35 | 2022-04-03 11:45:46.368 [rank:1] [train], epoch: 36/50, iter: 500/834, loss: 0.27605, lr: 0.256520, top1: 0.69708, throughput: 311.81 | 2022-04-03 11:46:47.972 [rank:6] [train], epoch: 36/50, iter: 500/834, loss: 0.27542, lr: 0.256520, top1: 0.69948, throughput: 311.63 | 2022-04-03 11:46:47.993 [rank:3] [train], epoch: 36/50, iter: 500/834, loss: 0.27770, lr: 0.256520, top1: 0.69333, throughput: 311.69 | 2022-04-03 11:46:47.998 [rank:0] [train], epoch: 36/50, iter: 500/834, loss: 0.27784, lr: 0.256520, top1: 0.69120, throughput: 311.78 | 2022-04-03 11:46:48.002 [rank:2] [train], epoch: 36/50, iter: 500/834, loss: 0.27793, lr: 0.256520, top1: 0.69021, throughput: 311.50 | 2022-04-03 11:46:48.005 [rank:7] [train], epoch: 36/50, iter: 500/834, loss: 0.27527, lr: 0.256520, top1: 0.69552, throughput: 312.00 | 2022-04-03 11:46:48.010 [rank:4] [train], epoch: 36/50, iter: 500/834, loss: 0.27481, lr: 0.256520, top1: 0.69714, throughput: 311.83 | 2022-04-03 11:46:48.011 [rank:5] [train], epoch: 36/50, iter: 500/834, loss: 0.27653, lr: 0.256520, top1: 0.69672, throughput: 311.89 | 2022-04-03 11:46:48.011 [rank:5] [train], epoch: 36/50, iter: 600/834, loss: 0.27828, lr: 0.252219, top1: 0.69672, throughput: 314.74 | 2022-04-03 11:47:49.015 [rank:3] [train], epoch: 36/50, iter: 600/834, loss: 0.27619, lr: 0.252219, top1: 0.69318, throughput: 314.61 | 2022-04-03 11:47:49.025 [rank:6] [train], epoch: 36/50, iter: 600/834, loss: 0.27623, lr: 0.252219, top1: 0.69839, throughput: 314.51 | 2022-04-03 11:47:49.041 [rank:1] [train], epoch: 36/50, iter: 600/834, loss: 0.27789, lr: 0.252219, top1: 0.69302, throughput: 314.30 | 2022-04-03 11:47:49.060 [rank:2] [train], epoch: 36/50, iter: 600/834, loss: 0.27733, lr: 0.252219, top1: 0.69000, throughput: 314.46 | 2022-04-03 11:47:49.061 [rank:0] [train], epoch: 36/50, iter: 600/834, loss: 0.27716, lr: 0.252219, top1: 0.69057, throughput: 314.33 | 2022-04-03 11:47:49.084 [rank:4] [train], epoch: 36/50, iter: 600/834, loss: 0.27635, lr: 0.252219, top1: 0.69474, throughput: 314.22 | 2022-04-03 11:47:49.116 [rank:7] [train], epoch: 36/50, iter: 600/834, loss: 0.27677, lr: 0.252219, top1: 0.69422, throughput: 314.50 | 2022-04-03 11:47:49.059 [rank:6] [train], epoch: 36/50, iter: 700/834, loss: 0.27655, lr: 0.247946, top1: 0.69411, throughput: 311.40 | 2022-04-03 11:48:50.698 [rank:2] [train], epoch: 36/50, iter: 700/834, loss: 0.27605, lr: 0.247946, top1: 0.69437, throughput: 311.49 | 2022-04-03 11:48:50.700 [rank:1] [train], epoch: 36/50, iter: 700/834, loss: 0.27473, lr: 0.247946, top1: 0.69682, throughput: 311.47 | 2022-04-03 11:48:50.703 [rank:5] [train], epoch: 36/50, iter: 700/834, loss: 0.27392, lr: 0.247946, top1: 0.70453, throughput: 311.19 | 2022-04-03 11:48:50.713 [rank:3] [train], epoch: 36/50, iter: 700/834, loss: 0.27768, lr: 0.247946, top1: 0.69229, throughput: 311.12 | 2022-04-03 11:48:50.739 [rank:0] [train], epoch: 36/50, iter: 700/834, loss: 0.27642, lr: 0.247946, top1: 0.69510, throughput: 311.40 | 2022-04-03 11:48:50.741 [rank:7] [train], epoch: 36/50, iter: 700/834, loss: 0.27629, lr: 0.247946, top1: 0.69724, throughput: 311.26 | 2022-04-03 11:48:50.743 [rank:4] [train], epoch: 36/50, iter: 700/834, loss: 0.27645, lr: 0.247946, top1: 0.69370, throughput: 311.37 | 2022-04-03 11:48:50.778 [rank:7] [train], epoch: 36/50, iter: 800/834, loss: 0.27630, lr: 0.243704, top1: 0.69370, throughput: 314.54 | 2022-04-03 11:49:51.785 [rank:1] [train], epoch: 36/50, iter: 800/834, loss: 0.27667, lr: 0.243704, top1: 0.69698, throughput: 314.25 | 2022-04-03 11:49:51.802 [rank:6] [train], epoch: 36/50, iter: 800/834, loss: 0.27691, lr: 0.243704, top1: 0.69609, throughput: 314.19 | 2022-04-03 11:49:51.808 [rank:2] [train], epoch: 36/50, iter: 800/834, loss: 0.27751, lr: 0.243704, top1: 0.69526, throughput: 314.19 | 2022-04-03 11:49:51.810 [rank:3] [train], epoch: 36/50, iter: 800/834, loss: 0.27633, lr: 0.243704, top1: 0.69615, throughput: 314.29 | 2022-04-03 11:49:51.828 [rank:5] [train], epoch: 36/50, iter: 800/834, loss: 0.27877, lr: 0.243704, top1: 0.68786, throughput: 314.13 | 2022-04-03 11:49:51.834 [rank:4] [train], epoch: 36/50, iter: 800/834, loss: 0.27881, lr: 0.243704, top1: 0.69203, throughput: 314.34 | 2022-04-03 11:49:51.858 [rank:0] [train], epoch: 36/50, iter: 800/834, loss: 0.27938, lr: 0.243704, top1: 0.68849, throughput: 314.08 | 2022-04-03 11:49:51.872 [rank:2] [train], epoch: 36/50, iter: 834/834, loss: 0.27130, lr: 0.242268, top1: 0.70466, throughput: 314.30 | 2022-04-03 11:50:12.580 [rank:1] [train], epoch: 36/50, iter: 834/834, loss: 0.27413, lr: 0.242268, top1: 0.70956, throughput: 314.12 | 2022-04-03 11:50:12.584 [rank:3] [train], epoch: 36/50, iter: 834/834, loss: 0.27433, lr: 0.242268, top1: 0.69945, throughput: 314.41 | 2022-04-03 11:50:12.591 [rank:6] [train], epoch: 36/50, iter: 834/834, loss: 0.27419, lr: 0.242268, top1: 0.69593, throughput: 314.07 | 2022-04-03 11:50:12.594 [rank:7] [train], epoch: 36/50, iter: 834/834, loss: 0.27705, lr: 0.242268, top1: 0.69930, throughput: 313.71 | 2022-04-03 11:50:12.594 [rank:5] [train], epoch: 36/50, iter: 834/834, loss: 0.27590, lr: 0.242268, top1: 0.69715, throughput: 314.40 | 2022-04-03 11:50:12.598 [rank:4] [train], epoch: 36/50, iter: 834/834, loss: 0.27711, lr: 0.242268, top1: 0.68811, throughput: 314.58 | 2022-04-03 11:50:12.609 [rank:0] [train], epoch: 36/50, iter: 834/834, loss: 0.27411, lr: 0.242268, top1: 0.69991, throughput: 314.47 | 2022-04-03 11:50:12.631 [rank:0] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.70192, throughput: 478.56 | 2022-04-03 11:50:25.691 [rank:1] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69952, throughput: 476.52 | 2022-04-03 11:50:25.700 [rank:2] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69472, throughput: 475.97 | 2022-04-03 11:50:25.711 [rank:5] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69712, throughput: 476.44 | 2022-04-03 11:50:25.716 [rank:4] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69984, throughput: 476.80 | 2022-04-03 11:50:25.717 [rank:7] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.71232, throughput: 476.25 | 2022-04-03 11:50:25.718 [rank:3] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.70016, throughput: 475.56 | 2022-04-03 11:50:25.733 [rank:6] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.70672, throughput: 475.57 | 2022-04-03 11:50:25.736 [rank:7] [train], epoch: 37/50, iter: 100/834, loss: 0.27532, lr: 0.238065, top1: 0.69901, throughput: 314.29 | 2022-04-03 11:51:26.808 [rank:3] [train], epoch: 37/50, iter: 100/834, loss: 0.26730, lr: 0.238065, top1: 0.71479, throughput: 314.32 | 2022-04-03 11:51:26.817 [rank:0] [train], epoch: 37/50, iter: 100/834, loss: 0.27148, lr: 0.238065, top1: 0.70568, throughput: 314.04 | 2022-04-03 11:51:26.831 [rank:6] [train], epoch: 37/50, iter: 100/834, loss: 0.27344, lr: 0.238065, top1: 0.69932, throughput: 314.19 | 2022-04-03 11:51:26.845 [rank:4] [train], epoch: 37/50, iter: 100/834, loss: 0.27240, lr: 0.238065, top1: 0.70422, throughput: 314.09 | 2022-04-03 11:51:26.845 [rank:1] [train], epoch: 37/50, iter: 100/834, loss: 0.27279, lr: 0.238065, top1: 0.70464, throughput: 313.98 | 2022-04-03 11:51:26.850 [rank:5] [train], epoch: 37/50, iter: 100/834, loss: 0.26792, lr: 0.238065, top1: 0.71250, throughput: 314.45 | 2022-04-03 11:51:26.775 [rank:2] [train], epoch: 37/50, iter: 100/834, loss: 0.27191, lr: 0.238065, top1: 0.70375, throughput: 314.38 | 2022-04-03 11:51:26.783 [rank:1] [train], epoch: 37/50, iter: 200/834, loss: 0.26948, lr: 0.233892, top1: 0.70750, throughput: 311.26 | 2022-04-03 11:52:28.534 [rank:2] [train], epoch: 37/50, iter: 200/834, loss: 0.26937, lr: 0.233892, top1: 0.71276, throughput: 310.91 | 2022-04-03 11:52:28.536 [rank:0] [train], epoch: 37/50, iter: 200/834, loss: 0.27124, lr: 0.233892, top1: 0.70198, throughput: 311.11 | 2022-04-03 11:52:28.545 [rank:4] [train], epoch: 37/50, iter: 200/834, loss: 0.27250, lr: 0.233892, top1: 0.70250, throughput: 311.16 | 2022-04-03 11:52:28.549 [rank:3] [train], epoch: 37/50, iter: 200/834, loss: 0.27284, lr: 0.233892, top1: 0.70219, throughput: 310.87 | 2022-04-03 11:52:28.578 [rank:7] [train], epoch: 37/50, iter: 200/834, loss: 0.27415, lr: 0.233892, top1: 0.70401, throughput: 310.79 | 2022-04-03 11:52:28.587 [rank:6] [train], epoch: 37/50, iter: 200/834, loss: 0.27326, lr: 0.233892, top1: 0.70089, throughput: 310.94 | 2022-04-03 11:52:28.592 [rank:5] [train], epoch: 37/50, iter: 200/834, loss: 0.27011, lr: 0.233892, top1: 0.70813, throughput: 310.51 | 2022-04-03 11:52:28.609 [rank:7] [train], epoch: 37/50, iter: 300/834, loss: 0.27121, lr: 0.229750, top1: 0.70688, throughput: 312.75 | 2022-04-03 11:53:29.978 [rank:5] [train], epoch: 37/50, iter: 300/834, loss: 0.27117, lr: 0.229750, top1: 0.70854, throughput: 312.85 | 2022-04-03 11:53:29.980 [rank:6] [train], epoch: 37/50, iter: 300/834, loss: 0.26979, lr: 0.229750, top1: 0.71115, throughput: 312.58 | 2022-04-03 11:53:30.016 [rank:0] [train], epoch: 37/50, iter: 300/834, loss: 0.27196, lr: 0.229750, top1: 0.70635, throughput: 312.32 | 2022-04-03 11:53:30.021 [rank:4] [train], epoch: 37/50, iter: 300/834, loss: 0.27122, lr: 0.229750, top1: 0.70594, throughput: 312.33 | 2022-04-03 11:53:30.022 [rank:2] [train], epoch: 37/50, iter: 300/834, loss: 0.27214, lr: 0.229750, top1: 0.70323, throughput: 312.26 | 2022-04-03 11:53:30.023 [rank:1] [train], epoch: 37/50, iter: 300/834, loss: 0.27249, lr: 0.229750, top1: 0.70167, throughput: 312.19 | 2022-04-03 11:53:30.035 [rank:3] [train], epoch: 37/50, iter: 300/834, loss: 0.27306, lr: 0.229750, top1: 0.69906, throughput: 312.36 | 2022-04-03 11:53:30.045 [rank:6] [train], epoch: 37/50, iter: 400/834, loss: 0.27210, lr: 0.225638, top1: 0.70755, throughput: 314.25 | 2022-04-03 11:54:31.115 [rank:3] [train], epoch: 37/50, iter: 400/834, loss: 0.27457, lr: 0.225638, top1: 0.69974, throughput: 314.33 | 2022-04-03 11:54:31.127 [rank:4] [train], epoch: 37/50, iter: 400/834, loss: 0.26946, lr: 0.225638, top1: 0.70995, throughput: 314.14 | 2022-04-03 11:54:31.141 [rank:2] [train], epoch: 37/50, iter: 400/834, loss: 0.27201, lr: 0.225638, top1: 0.70094, throughput: 314.10 | 2022-04-03 11:54:31.150 [rank:7] [train], epoch: 37/50, iter: 400/834, loss: 0.27169, lr: 0.225638, top1: 0.70505, throughput: 313.86 | 2022-04-03 11:54:31.151 [rank:5] [train], epoch: 37/50, iter: 400/834, loss: 0.27044, lr: 0.225638, top1: 0.70781, throughput: 313.79 | 2022-04-03 11:54:31.168 [rank:1] [train], epoch: 37/50, iter: 400/834, loss: 0.27250, lr: 0.225638, top1: 0.70594, throughput: 314.04 | 2022-04-03 11:54:31.173 [rank:0] [train], epoch: 37/50, iter: 400/834, loss: 0.26986, lr: 0.225638, top1: 0.70563, throughput: 313.88 | 2022-04-03 11:54:31.190 [rank:6] [train], epoch: 37/50, iter: 500/834, loss: 0.27291, lr: 0.221557, top1: 0.70297, throughput: 313.36 | 2022-04-03 11:55:32.386 [rank:3] [train], epoch: 37/50, iter: 500/834, loss: 0.27166, lr: 0.221557, top1: 0.70141, throughput: 313.33 | 2022-04-03 11:55:32.404 [rank:4] [train], epoch: 37/50, iter: 500/834, loss: 0.27014, lr: 0.221557, top1: 0.70979, throughput: 313.40 | 2022-04-03 11:55:32.405 [rank:5] [train], epoch: 37/50, iter: 500/834, loss: 0.27250, lr: 0.221557, top1: 0.70302, throughput: 313.50 | 2022-04-03 11:55:32.412 [rank:2] [train], epoch: 37/50, iter: 500/834, loss: 0.27234, lr: 0.221557, top1: 0.70255, throughput: 313.34 | 2022-04-03 11:55:32.425 [rank:0] [train], epoch: 37/50, iter: 500/834, loss: 0.26932, lr: 0.221557, top1: 0.70849, throughput: 313.53 | 2022-04-03 11:55:32.427 [rank:1] [train], epoch: 37/50, iter: 500/834, loss: 0.27371, lr: 0.221557, top1: 0.69943, throughput: 313.44 | 2022-04-03 11:55:32.428 [rank:7] [train], epoch: 37/50, iter: 500/834, loss: 0.26999, lr: 0.221557, top1: 0.70708, throughput: 313.01 | 2022-04-03 11:55:32.491 [rank:2] [train], epoch: 37/50, iter: 600/834, loss: 0.27389, lr: 0.217507, top1: 0.69755, throughput: 313.91 | 2022-04-03 11:56:33.590 [rank:1] [train], epoch: 37/50, iter: 600/834, loss: 0.27202, lr: 0.217507, top1: 0.70198, throughput: 313.92 | 2022-04-03 11:56:33.590 [rank:3] [train], epoch: 37/50, iter: 600/834, loss: 0.27194, lr: 0.217507, top1: 0.70432, throughput: 313.68 | 2022-04-03 11:56:33.612 [rank:5] [train], epoch: 37/50, iter: 600/834, loss: 0.27236, lr: 0.217507, top1: 0.70234, throughput: 313.66 | 2022-04-03 11:56:33.625 [rank:4] [train], epoch: 37/50, iter: 600/834, loss: 0.27128, lr: 0.217507, top1: 0.70859, throughput: 313.61 | 2022-04-03 11:56:33.627 [rank:6] [train], epoch: 37/50, iter: 600/834, loss: 0.27067, lr: 0.217507, top1: 0.70698, throughput: 313.41 | 2022-04-03 11:56:33.647 [rank:0] [train], epoch: 37/50, iter: 600/834, loss: 0.27340, lr: 0.217507, top1: 0.69953, throughput: 313.60 | 2022-04-03 11:56:33.653 [rank:7] [train], epoch: 37/50, iter: 600/834, loss: 0.27025, lr: 0.217507, top1: 0.70578, throughput: 314.26 | 2022-04-03 11:56:33.587 [rank:6] [train], epoch: 37/50, iter: 700/834, loss: 0.27125, lr: 0.213488, top1: 0.70307, throughput: 312.01 | 2022-04-03 11:57:35.183 [rank:5] [train], epoch: 37/50, iter: 700/834, loss: 0.27045, lr: 0.213488, top1: 0.70536, throughput: 311.85 | 2022-04-03 11:57:35.193 [rank:0] [train], epoch: 37/50, iter: 700/834, loss: 0.27380, lr: 0.213488, top1: 0.70120, throughput: 311.90 | 2022-04-03 11:57:35.211 [rank:7] [train], epoch: 37/50, iter: 700/834, loss: 0.27127, lr: 0.213488, top1: 0.70510, throughput: 311.54 | 2022-04-03 11:57:35.217 [rank:2] [train], epoch: 37/50, iter: 700/834, loss: 0.27357, lr: 0.213488, top1: 0.69948, throughput: 311.52 | 2022-04-03 11:57:35.223 [rank:3] [train], epoch: 37/50, iter: 700/834, loss: 0.27341, lr: 0.213488, top1: 0.70448, throughput: 311.57 | 2022-04-03 11:57:35.236 [rank:4] [train], epoch: 37/50, iter: 700/834, loss: 0.27267, lr: 0.213488, top1: 0.70365, throughput: 311.64 | 2022-04-03 11:57:35.237 [rank:1] [train], epoch: 37/50, iter: 700/834, loss: 0.27264, lr: 0.213488, top1: 0.70021, throughput: 311.32 | 2022-04-03 11:57:35.263 [rank:6] [train], epoch: 37/50, iter: 800/834, loss: 0.27460, lr: 0.209501, top1: 0.70021, throughput: 312.83 | 2022-04-03 11:58:36.557 [rank:3] [train], epoch: 37/50, iter: 800/834, loss: 0.27182, lr: 0.209501, top1: 0.70214, throughput: 313.10 | 2022-04-03 11:58:36.559 [rank:7] [train], epoch: 37/50, iter: 800/834, loss: 0.27452, lr: 0.209501, top1: 0.69724, throughput: 312.94 | 2022-04-03 11:58:36.570 [rank:2] [train], epoch: 37/50, iter: 800/834, loss: 0.27376, lr: 0.209501, top1: 0.70099, throughput: 312.92 | 2022-04-03 11:58:36.580 [rank:4] [train], epoch: 37/50, iter: 800/834, loss: 0.27150, lr: 0.209501, top1: 0.70589, throughput: 312.93 | 2022-04-03 11:58:36.593 [rank:1] [train], epoch: 37/50, iter: 800/834, loss: 0.27261, lr: 0.209501, top1: 0.70120, throughput: 312.95 | 2022-04-03 11:58:36.614 [rank:5] [train], epoch: 37/50, iter: 800/834, loss: 0.27467, lr: 0.209501, top1: 0.70151, throughput: 312.57 | 2022-04-03 11:58:36.619 [rank:0] [train], epoch: 37/50, iter: 800/834, loss: 0.27171, lr: 0.209501, top1: 0.70349, throughput: 312.60 | 2022-04-03 11:58:36.630 [rank:3] [train], epoch: 37/50, iter: 834/834, loss: 0.26851, lr: 0.208152, top1: 0.70956, throughput: 310.15 | 2022-04-03 11:58:57.607 [rank:7] [train], epoch: 37/50, iter: 834/834, loss: 0.26908, lr: 0.208152, top1: 0.71569, throughput: 310.30 | 2022-04-03 11:58:57.608 [rank:0] [train], epoch: 37/50, iter: 834/834, loss: 0.27045, lr: 0.208152, top1: 0.70374, throughput: 311.17 | 2022-04-03 11:58:57.609 [rank:2] [train], epoch: 37/50, iter: 834/834, loss: 0.26948, lr: 0.208152, top1: 0.71140, throughput: 310.37 | 2022-04-03 11:58:57.613 [rank:1] [train], epoch: 37/50, iter: 834/834, loss: 0.27530, lr: 0.208152, top1: 0.70297, throughput: 310.86 | 2022-04-03 11:58:57.614 [rank:4] [train], epoch: 37/50, iter: 834/834, loss: 0.27495, lr: 0.208152, top1: 0.69822, throughput: 310.41 | 2022-04-03 11:58:57.623 [rank:5] [train], epoch: 37/50, iter: 834/834, loss: 0.27361, lr: 0.208152, top1: 0.69715, throughput: 310.28 | 2022-04-03 11:58:57.658 [rank:6] [train], epoch: 37/50, iter: 834/834, loss: 0.27360, lr: 0.208152, top1: 0.70420, throughput: 309.19 | 2022-04-03 11:58:57.670 [rank:0] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.71136, throughput: 480.20 | 2022-04-03 11:59:10.625 [rank:2] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70080, throughput: 480.13 | 2022-04-03 11:59:10.630 [rank:1] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.71120, throughput: 480.02 | 2022-04-03 11:59:10.634 [rank:4] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70176, throughput: 480.30 | 2022-04-03 11:59:10.636 [rank:7] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70928, throughput: 479.72 | 2022-04-03 11:59:10.636 [rank:5] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70080, throughput: 481.21 | 2022-04-03 11:59:10.647 [rank:6] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70864, throughput: 481.17 | 2022-04-03 11:59:10.659 [rank:3] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70672, throughput: 478.71 | 2022-04-03 11:59:10.663 [rank:3] [train], epoch: 38/50, iter: 100/834, loss: 0.26661, lr: 0.204207, top1: 0.71490, throughput: 314.20 | 2022-04-03 12:00:11.770 [rank:1] [train], epoch: 38/50, iter: 100/834, loss: 0.26721, lr: 0.204207, top1: 0.71729, throughput: 313.95 | 2022-04-03 12:00:11.790 [rank:5] [train], epoch: 38/50, iter: 100/834, loss: 0.26731, lr: 0.204207, top1: 0.71646, throughput: 313.92 | 2022-04-03 12:00:11.809 [rank:0] [train], epoch: 38/50, iter: 100/834, loss: 0.26600, lr: 0.204207, top1: 0.71219, throughput: 313.80 | 2022-04-03 12:00:11.809 [rank:4] [train], epoch: 38/50, iter: 100/834, loss: 0.26398, lr: 0.204207, top1: 0.72062, throughput: 313.86 | 2022-04-03 12:00:11.810 [rank:6] [train], epoch: 38/50, iter: 100/834, loss: 0.26567, lr: 0.204207, top1: 0.71969, throughput: 313.84 | 2022-04-03 12:00:11.836 [rank:7] [train], epoch: 38/50, iter: 100/834, loss: 0.26585, lr: 0.204207, top1: 0.71500, throughput: 314.12 | 2022-04-03 12:00:11.759 [rank:2] [train], epoch: 38/50, iter: 100/834, loss: 0.26935, lr: 0.204207, top1: 0.71146, throughput: 313.61 | 2022-04-03 12:00:11.853 [rank:6] [train], epoch: 38/50, iter: 200/834, loss: 0.26619, lr: 0.200294, top1: 0.71594, throughput: 314.99 | 2022-04-03 12:01:12.790 [rank:0] [train], epoch: 38/50, iter: 200/834, loss: 0.26645, lr: 0.200294, top1: 0.71505, throughput: 314.84 | 2022-04-03 12:01:12.792 [rank:1] [train], epoch: 38/50, iter: 200/834, loss: 0.26714, lr: 0.200294, top1: 0.71073, throughput: 314.70 | 2022-04-03 12:01:12.802 [rank:3] [train], epoch: 38/50, iter: 200/834, loss: 0.26723, lr: 0.200294, top1: 0.71318, throughput: 314.53 | 2022-04-03 12:01:12.813 [rank:5] [train], epoch: 38/50, iter: 200/834, loss: 0.26787, lr: 0.200294, top1: 0.71172, throughput: 314.65 | 2022-04-03 12:01:12.830 [rank:7] [train], epoch: 38/50, iter: 200/834, loss: 0.26633, lr: 0.200294, top1: 0.71786, throughput: 314.36 | 2022-04-03 12:01:12.835 [rank:2] [train], epoch: 38/50, iter: 200/834, loss: 0.26584, lr: 0.200294, top1: 0.71557, throughput: 314.81 | 2022-04-03 12:01:12.842 [rank:4] [train], epoch: 38/50, iter: 200/834, loss: 0.26797, lr: 0.200294, top1: 0.71411, throughput: 314.56 | 2022-04-03 12:01:12.848 [rank:1] [train], epoch: 38/50, iter: 300/834, loss: 0.26850, lr: 0.196414, top1: 0.70724, throughput: 313.03 | 2022-04-03 12:02:14.138 [rank:5] [train], epoch: 38/50, iter: 300/834, loss: 0.26704, lr: 0.196414, top1: 0.71422, throughput: 313.15 | 2022-04-03 12:02:14.142 [rank:7] [train], epoch: 38/50, iter: 300/834, loss: 0.26799, lr: 0.196414, top1: 0.71510, throughput: 313.18 | 2022-04-03 12:02:14.142 [rank:6] [train], epoch: 38/50, iter: 300/834, loss: 0.26708, lr: 0.196414, top1: 0.71667, throughput: 312.88 | 2022-04-03 12:02:14.156 [rank:4] [train], epoch: 38/50, iter: 300/834, loss: 0.26822, lr: 0.196414, top1: 0.71203, throughput: 313.11 | 2022-04-03 12:02:14.169 [rank:3] [train], epoch: 38/50, iter: 300/834, loss: 0.26683, lr: 0.196414, top1: 0.71755, throughput: 312.92 | 2022-04-03 12:02:14.171 [rank:0] [train], epoch: 38/50, iter: 300/834, loss: 0.26650, lr: 0.196414, top1: 0.72104, throughput: 312.77 | 2022-04-03 12:02:14.180 [rank:2] [train], epoch: 38/50, iter: 300/834, loss: 0.26738, lr: 0.196414, top1: 0.71302, throughput: 312.94 | 2022-04-03 12:02:14.195 [rank:5] [train], epoch: 38/50, iter: 400/834, loss: 0.26692, lr: 0.192566, top1: 0.71583, throughput: 312.68 | 2022-04-03 12:03:15.546 [rank:2] [train], epoch: 38/50, iter: 400/834, loss: 0.26712, lr: 0.192566, top1: 0.71432, throughput: 312.95 | 2022-04-03 12:03:15.546 [rank:6] [train], epoch: 38/50, iter: 400/834, loss: 0.26735, lr: 0.192566, top1: 0.71401, throughput: 312.70 | 2022-04-03 12:03:15.556 [rank:3] [train], epoch: 38/50, iter: 400/834, loss: 0.26920, lr: 0.192566, top1: 0.70958, throughput: 312.78 | 2022-04-03 12:03:15.556 [rank:0] [train], epoch: 38/50, iter: 400/834, loss: 0.26882, lr: 0.192566, top1: 0.70839, throughput: 312.78 | 2022-04-03 12:03:15.565 [rank:7] [train], epoch: 38/50, iter: 400/834, loss: 0.26633, lr: 0.192566, top1: 0.71370, throughput: 312.55 | 2022-04-03 12:03:15.571 [rank:1] [train], epoch: 38/50, iter: 400/834, loss: 0.26801, lr: 0.192566, top1: 0.71469, throughput: 312.50 | 2022-04-03 12:03:15.577 [rank:4] [train], epoch: 38/50, iter: 400/834, loss: 0.26781, lr: 0.192566, top1: 0.71214, throughput: 312.61 | 2022-04-03 12:03:15.587 [rank:4] [train], epoch: 38/50, iter: 500/834, loss: 0.26459, lr: 0.188750, top1: 0.71979, throughput: 313.65 | 2022-04-03 12:04:16.801 [rank:1] [train], epoch: 38/50, iter: 500/834, loss: 0.26553, lr: 0.188750, top1: 0.71849, throughput: 313.59 | 2022-04-03 12:04:16.803 [rank:2] [train], epoch: 38/50, iter: 500/834, loss: 0.26808, lr: 0.188750, top1: 0.71250, throughput: 313.42 | 2022-04-03 12:04:16.807 [rank:6] [train], epoch: 38/50, iter: 500/834, loss: 0.26966, lr: 0.188750, top1: 0.71125, throughput: 313.34 | 2022-04-03 12:04:16.832 [rank:0] [train], epoch: 38/50, iter: 500/834, loss: 0.26646, lr: 0.188750, top1: 0.71844, throughput: 313.37 | 2022-04-03 12:04:16.834 [rank:7] [train], epoch: 38/50, iter: 500/834, loss: 0.26895, lr: 0.188750, top1: 0.71125, throughput: 313.38 | 2022-04-03 12:04:16.840 [rank:3] [train], epoch: 38/50, iter: 500/834, loss: 0.26683, lr: 0.188750, top1: 0.71510, throughput: 313.30 | 2022-04-03 12:04:16.839 [rank:5] [train], epoch: 38/50, iter: 500/834, loss: 0.26298, lr: 0.188750, top1: 0.72187, throughput: 313.11 | 2022-04-03 12:04:16.867 [rank:3] [train], epoch: 38/50, iter: 600/834, loss: 0.26736, lr: 0.184968, top1: 0.71396, throughput: 314.45 | 2022-04-03 12:05:17.898 [rank:6] [train], epoch: 38/50, iter: 600/834, loss: 0.26876, lr: 0.184968, top1: 0.70828, throughput: 314.22 | 2022-04-03 12:05:17.936 [rank:5] [train], epoch: 38/50, iter: 600/834, loss: 0.26956, lr: 0.184968, top1: 0.70635, throughput: 314.31 | 2022-04-03 12:05:17.953 [rank:4] [train], epoch: 38/50, iter: 600/834, loss: 0.26686, lr: 0.184968, top1: 0.71365, throughput: 313.92 | 2022-04-03 12:05:17.964 [rank:1] [train], epoch: 38/50, iter: 600/834, loss: 0.26756, lr: 0.184968, top1: 0.71172, throughput: 313.92 | 2022-04-03 12:05:17.965 [rank:0] [train], epoch: 38/50, iter: 600/834, loss: 0.26808, lr: 0.184968, top1: 0.71083, throughput: 314.03 | 2022-04-03 12:05:17.974 [rank:7] [train], epoch: 38/50, iter: 600/834, loss: 0.26850, lr: 0.184968, top1: 0.71578, throughput: 314.06 | 2022-04-03 12:05:17.974 [rank:2] [train], epoch: 38/50, iter: 600/834, loss: 0.26884, lr: 0.184968, top1: 0.71130, throughput: 314.20 | 2022-04-03 12:05:17.914 [rank:1] [train], epoch: 38/50, iter: 700/834, loss: 0.26777, lr: 0.181218, top1: 0.71354, throughput: 311.95 | 2022-04-03 12:06:19.513 [rank:5] [train], epoch: 38/50, iter: 700/834, loss: 0.27125, lr: 0.181218, top1: 0.70828, throughput: 311.86 | 2022-04-03 12:06:19.519 [rank:2] [train], epoch: 38/50, iter: 700/834, loss: 0.26782, lr: 0.181218, top1: 0.71109, throughput: 311.49 | 2022-04-03 12:06:19.552 [rank:7] [train], epoch: 38/50, iter: 700/834, loss: 0.26770, lr: 0.181218, top1: 0.71380, throughput: 311.79 | 2022-04-03 12:06:19.554 [rank:0] [train], epoch: 38/50, iter: 700/834, loss: 0.27089, lr: 0.181218, top1: 0.70406, throughput: 311.73 | 2022-04-03 12:06:19.566 [rank:6] [train], epoch: 38/50, iter: 700/834, loss: 0.27117, lr: 0.181218, top1: 0.70313, throughput: 311.46 | 2022-04-03 12:06:19.582 [rank:3] [train], epoch: 38/50, iter: 700/834, loss: 0.26797, lr: 0.181218, top1: 0.71036, throughput: 311.19 | 2022-04-03 12:06:19.596 [rank:4] [train], epoch: 38/50, iter: 700/834, loss: 0.26562, lr: 0.181218, top1: 0.71443, throughput: 311.41 | 2022-04-03 12:06:19.618 [rank:4] [train], epoch: 38/50, iter: 800/834, loss: 0.26786, lr: 0.177502, top1: 0.71333, throughput: 312.67 | 2022-04-03 12:07:21.024 [rank:7] [train], epoch: 38/50, iter: 800/834, loss: 0.26608, lr: 0.177502, top1: 0.71438, throughput: 312.33 | 2022-04-03 12:07:21.028 [rank:6] [train], epoch: 38/50, iter: 800/834, loss: 0.26633, lr: 0.177502, top1: 0.71432, throughput: 312.47 | 2022-04-03 12:07:21.029 [rank:2] [train], epoch: 38/50, iter: 800/834, loss: 0.26881, lr: 0.177502, top1: 0.70964, throughput: 312.21 | 2022-04-03 12:07:21.049 [rank:3] [train], epoch: 38/50, iter: 800/834, loss: 0.26879, lr: 0.177502, top1: 0.71005, throughput: 312.39 | 2022-04-03 12:07:21.059 [rank:1] [train], epoch: 38/50, iter: 800/834, loss: 0.26795, lr: 0.177502, top1: 0.70901, throughput: 311.90 | 2022-04-03 12:07:21.072 [rank:5] [train], epoch: 38/50, iter: 800/834, loss: 0.26985, lr: 0.177502, top1: 0.71068, throughput: 311.92 | 2022-04-03 12:07:21.074 [rank:0] [train], epoch: 38/50, iter: 800/834, loss: 0.26610, lr: 0.177502, top1: 0.71828, throughput: 312.13 | 2022-04-03 12:07:21.078 [rank:2] [train], epoch: 38/50, iter: 834/834, loss: 0.26914, lr: 0.176246, top1: 0.70818, throughput: 313.45 | 2022-04-03 12:07:41.875 [rank:1] [train], epoch: 38/50, iter: 834/834, loss: 0.26649, lr: 0.176246, top1: 0.71324, throughput: 313.73 | 2022-04-03 12:07:41.880 [rank:6] [train], epoch: 38/50, iter: 834/834, loss: 0.26770, lr: 0.176246, top1: 0.71599, throughput: 313.04 | 2022-04-03 12:07:41.882 [rank:0] [train], epoch: 38/50, iter: 834/834, loss: 0.26822, lr: 0.176246, top1: 0.71170, throughput: 313.75 | 2022-04-03 12:07:41.884 [rank:7] [train], epoch: 38/50, iter: 834/834, loss: 0.26623, lr: 0.176246, top1: 0.71017, throughput: 312.94 | 2022-04-03 12:07:41.888 [rank:4] [train], epoch: 38/50, iter: 834/834, loss: 0.26233, lr: 0.176246, top1: 0.72411, throughput: 312.87 | 2022-04-03 12:07:41.888 [rank:5] [train], epoch: 38/50, iter: 834/834, loss: 0.26154, lr: 0.176246, top1: 0.71967, throughput: 313.59 | 2022-04-03 12:07:41.891 [rank:3] [train], epoch: 38/50, iter: 834/834, loss: 0.26646, lr: 0.176246, top1: 0.71599, throughput: 313.34 | 2022-04-03 12:07:41.892 [rank:0] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71648, throughput: 482.59 | 2022-04-03 12:07:54.835 [rank:2] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.70912, throughput: 482.07 | 2022-04-03 12:07:54.840 [rank:4] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71088, throughput: 482.09 | 2022-04-03 12:07:54.853 [rank:1] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71680, throughput: 481.75 | 2022-04-03 12:07:54.853 [rank:7] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.72208, throughput: 482.00 | 2022-04-03 12:07:54.855 [rank:3] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71456, throughput: 481.96 | 2022-04-03 12:07:54.860 [rank:5] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.70480, throughput: 481.90 | 2022-04-03 12:07:54.860 [rank:6] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71376, throughput: 481.03 | 2022-04-03 12:07:54.875 [rank:7] [train], epoch: 39/50, iter: 100/834, loss: 0.26127, lr: 0.172575, top1: 0.72677, throughput: 312.98 | 2022-04-03 12:08:56.202 [rank:6] [train], epoch: 39/50, iter: 100/834, loss: 0.26350, lr: 0.172575, top1: 0.72458, throughput: 313.01 | 2022-04-03 12:08:56.216 [rank:3] [train], epoch: 39/50, iter: 100/834, loss: 0.26130, lr: 0.172575, top1: 0.72719, throughput: 312.92 | 2022-04-03 12:08:56.217 [rank:5] [train], epoch: 39/50, iter: 100/834, loss: 0.26371, lr: 0.172575, top1: 0.72135, throughput: 312.88 | 2022-04-03 12:08:56.226 [rank:1] [train], epoch: 39/50, iter: 100/834, loss: 0.26234, lr: 0.172575, top1: 0.72578, throughput: 312.72[rank:0] [train], epoch: 39/50, iter: 100/834, loss: 0.25989, lr: 0.172575, top1: 0.72880, throughput: 312.63 | 2022-04-03 12:08:56.250| 2022-04-03 12:08:56.250 [rank:2] [train], epoch: 39/50, iter: 100/834, loss: 0.26064, lr: 0.172575, top1: 0.72833, throughput: 312.55 | 2022-04-03 12:08:56.271 [rank:4] [train], epoch: 39/50, iter: 100/834, loss: 0.26264, lr: 0.172575, top1: 0.71870, throughput: 312.99 | 2022-04-03 12:08:56.196 [rank:5] [train], epoch: 39/50, iter: 200/834, loss: 0.26277, lr: 0.168937, top1: 0.72599, throughput: 315.33 | 2022-04-03 12:09:57.114 [rank:1] [train], epoch: 39/50, iter: 200/834, loss: 0.26106, lr: 0.168937, top1: 0.72411, throughput: 315.43 | 2022-04-03 12:09:57.120 [rank:7] [train], epoch: 39/50, iter: 200/834, loss: 0.26381, lr: 0.168937, top1: 0.72281, throughput: 314.91 | 2022-04-03 12:09:57.172 [rank:0] [train], epoch: 39/50, iter: 200/834, loss: 0.26251, lr: 0.168937, top1: 0.72297, throughput: 315.15 | 2022-04-03 12:09:57.173 [rank:6] [train], epoch: 39/50, iter: 200/834, loss: 0.26408, lr: 0.168937, top1: 0.72115, throughput: 314.97 | 2022-04-03 12:09:57.174 [rank:3] [train], epoch: 39/50, iter: 200/834, loss: 0.26254, lr: 0.168937, top1: 0.72286, throughput: 314.97 | 2022-04-03 12:09:57.174 [rank:4] [train], epoch: 39/50, iter: 200/834, loss: 0.26327, lr: 0.168937, top1: 0.72505, throughput: 314.80 | 2022-04-03 12:09:57.188 [rank:2] [train], epoch: 39/50, iter: 200/834, loss: 0.26155, lr: 0.168937, top1: 0.72458, throughput: 314.93 | 2022-04-03 12:09:57.237 [rank:6] [train], epoch: 39/50, iter: 300/834, loss: 0.26229, lr: 0.165334, top1: 0.72536, throughput: 313.35 | 2022-04-03 12:10:58.446 [rank:5] [train], epoch: 39/50, iter: 300/834, loss: 0.26192, lr: 0.165334, top1: 0.72812, throughput: 313.04 | 2022-04-03 12:10:58.448 [rank:7] [train], epoch: 39/50, iter: 300/834, loss: 0.26418, lr: 0.165334, top1: 0.72229, throughput: 313.31 | 2022-04-03 12:10:58.452 [rank:1] [train], epoch: 39/50, iter: 300/834, loss: 0.26692, lr: 0.165334, top1: 0.71156, throughput: 313.05 | 2022-04-03 12:10:58.453 [rank:0] [train], epoch: 39/50, iter: 300/834, loss: 0.26351, lr: 0.165334, top1: 0.72255, throughput: 313.30 | 2022-04-03 12:10:58.456 [rank:2] [train], epoch: 39/50, iter: 300/834, loss: 0.26456, lr: 0.165334, top1: 0.72146, throughput: 313.63 | 2022-04-03 12:10:58.456 [rank:4] [train], epoch: 39/50, iter: 300/834, loss: 0.26334, lr: 0.165334, top1: 0.72276, throughput: 313.33 | 2022-04-03 12:10:58.464 [rank:3] [train], epoch: 39/50, iter: 300/834, loss: 0.26635, lr: 0.165334, top1: 0.71401, throughput: 313.24 | 2022-04-03 12:10:58.469 [rank:5] [train], epoch: 39/50, iter: 400/834, loss: 0.26218, lr: 0.161764, top1: 0.72260, throughput: 310.87 | 2022-04-03 12:12:00.210 [rank:7] [train], epoch: 39/50, iter: 400/834, loss: 0.26155, lr: 0.161764, top1: 0.72583, throughput: 310.84 | 2022-04-03 12:12:00.221 [rank:6] [train], epoch: 39/50, iter: 400/834, loss: 0.26286, lr: 0.161764, top1: 0.72401, throughput: 310.75 | 2022-04-03 12:12:00.233 [rank:3] [train], epoch: 39/50, iter: 400/834, loss: 0.26371, lr: 0.161764, top1: 0.72219, throughput: 310.85 | 2022-04-03 12:12:00.235 [rank:0] [train], epoch: 39/50, iter: 400/834, loss: 0.26297, lr: 0.161764, top1: 0.72036, throughput: 310.78 | 2022-04-03 12:12:00.237 [rank:2] [train], epoch: 39/50, iter: 400/834, loss: 0.26339, lr: 0.161764, top1: 0.72292, throughput: 310.77 | 2022-04-03 12:12:00.239 [rank:1] [train], epoch: 39/50, iter: 400/834, loss: 0.26308, lr: 0.161764, top1: 0.72203, throughput: 310.69 | 2022-04-03 12:12:00.250 [rank:4] [train], epoch: 39/50, iter: 400/834, loss: 0.26285, lr: 0.161764, top1: 0.72255, throughput: 310.62 | 2022-04-03 12:12:00.276 [rank:2] [train], epoch: 39/50, iter: 500/834, loss: 0.26274, lr: 0.158229, top1: 0.72245, throughput: 312.19 | 2022-04-03 12:13:01.741 [rank:0] [train], epoch: 39/50, iter: 500/834, loss: 0.26468, lr: 0.158229, top1: 0.71609, throughput: 311.91 | 2022-04-03 12:13:01.792 [rank:5] [train], epoch: 39/50, iter: 500/834, loss: 0.26067, lr: 0.158229, top1: 0.72516, throughput: 311.66 | 2022-04-03 12:13:01.815 [rank:6] [train], epoch: 39/50, iter: 500/834, loss: 0.26516, lr: 0.158229, top1: 0.72292, throughput: 311.74 | 2022-04-03 12:13:01.823 [rank:1] [train], epoch: 39/50, iter: 500/834, loss: 0.26353, lr: 0.158229, top1: 0.72078, throughput: 311.81 | 2022-04-03 12:13:01.827 [rank:4] [train], epoch: 39/50, iter: 500/834, loss: 0.26124, lr: 0.158229, top1: 0.72224, throughput: 311.88 | 2022-04-03 12:13:01.838 [rank:7] [train], epoch: 39/50, iter: 500/834, loss: 0.26473, lr: 0.158229, top1: 0.71865, throughput: 311.56 | 2022-04-03 12:13:01.847 [rank:3] [train], epoch: 39/50, iter: 500/834, loss: 0.26341, lr: 0.158229, top1: 0.72068, throughput: 311.63 | 2022-04-03 12:13:01.847 [rank:2] [train], epoch: 39/50, iter: 600/834, loss: 0.26497, lr: 0.154729, top1: 0.71901, throughput: 309.84 | 2022-04-03 12:14:03.708 [rank:3] [train], epoch: 39/50, iter: 600/834, loss: 0.26384, lr: 0.154729, top1: 0.72161, throughput: 310.12 | 2022-04-03 12:14:03.758 [rank:4] [train], epoch: 39/50, iter: 600/834, loss: 0.26255, lr: 0.154729, top1: 0.72484, throughput: 309.98 | 2022-04-03 12:14:03.777 [rank:1] [train], epoch: 39/50, iter: 600/834, loss: 0.26442, lr: 0.154729, top1: 0.71839, throughput: 309.90 | 2022-04-03 12:14:03.783 [rank:6] [train], epoch: 39/50, iter: 600/834, loss: 0.26478, lr: 0.154729, top1: 0.71792, throughput: 309.86 | 2022-04-03 12:14:03.787 [rank:0] [train], epoch: 39/50, iter: 600/834, loss: 0.26330, lr: 0.154729, top1: 0.72047, throughput: 309.64 | 2022-04-03 12:14:03.801 [rank:5] [train], epoch: 39/50, iter: 600/834, loss: 0.26379, lr: 0.154729, top1: 0.72161, throughput: 309.59 | 2022-04-03 12:14:03.833 [rank:7] [train], epoch: 39/50, iter: 600/834, loss: 0.26465, lr: 0.154729, top1: 0.71776, throughput: 310.19 | 2022-04-03 12:14:03.744 [rank:6] [train], epoch: 39/50, iter: 700/834, loss: 0.26334, lr: 0.151264, top1: 0.72354, throughput: 313.67 | 2022-04-03 12:15:04.997 [rank:2] [train], epoch: 39/50, iter: 700/834, loss: 0.26308, lr: 0.151264, top1: 0.72302, throughput: 313.23 | 2022-04-03 12:15:05.005 [rank:1] [train], epoch: 39/50, iter: 700/834, loss: 0.26247, lr: 0.151264, top1: 0.72427, throughput: 313.53 | 2022-04-03 12:15:05.021 [rank:7] [train], epoch: 39/50, iter: 700/834, loss: 0.26366, lr: 0.151264, top1: 0.72078, throughput: 313.29 | 2022-04-03 12:15:05.029 [rank:5] [train], epoch: 39/50, iter: 700/834, loss: 0.26183, lr: 0.151264, top1: 0.72333, throughput: 313.70 | 2022-04-03 12:15:05.038 [rank:4] [train], epoch: 39/50, iter: 700/834, loss: 0.26132, lr: 0.151264, top1: 0.72828, throughput: 313.40 | 2022-04-03 12:15:05.040 [rank:0] [train], epoch: 39/50, iter: 700/834, loss: 0.26663, lr: 0.151264, top1: 0.71839, throughput: 313.35 | 2022-04-03 12:15:05.074 [rank:3] [train], epoch: 39/50, iter: 700/834, loss: 0.26264, lr: 0.151264, top1: 0.72177, throughput: 312.99 | 2022-04-03 12:15:05.101 [rank:4] [train], epoch: 39/50, iter: 800/834, loss: 0.26143, lr: 0.147833, top1: 0.72370, throughput: 313.95 | 2022-04-03 12:16:06.196 [rank:7] [train], epoch: 39/50, iter: 800/834, loss: 0.26188, lr: 0.147833, top1: 0.72521, throughput: 313.84 | 2022-04-03 12:16:06.207 [rank:2] [train], epoch: 39/50, iter: 800/834, loss: 0.26382, lr: 0.147833, top1: 0.72052, throughput: 313.62 | 2022-04-03 12:16:06.226 [rank:5] [train], epoch: 39/50, iter: 800/834, loss: 0.26422, lr: 0.147833, top1: 0.72125, throughput: 313.73 | 2022-04-03 12:16:06.238 [rank:0] [train], epoch: 39/50, iter: 800/834, loss: 0.26468, lr: 0.147833, top1: 0.72026, throughput: 313.91 | 2022-04-03 12:16:06.238 [rank:3] [train], epoch: 39/50, iter: 800/834, loss: 0.26187, lr: 0.147833, top1: 0.72302, throughput: 313.97 | 2022-04-03 12:16:06.255 [rank:6] [train], epoch: 39/50, iter: 800/834, loss: 0.26090, lr: 0.147833, top1: 0.72833, throughput: 313.35 | 2022-04-03 12:16:06.271 [rank:1] [train], epoch: 39/50, iter: 800/834, loss: 0.26480, lr: 0.147833, top1: 0.71708, throughput: 313.91 | 2022-04-03 12:16:06.186 [rank:7] [train], epoch: 39/50, iter: 834/834, loss: 0.26312, lr: 0.146675, top1: 0.72365, throughput: 311.98 | 2022-04-03 12:16:27.131 [rank:2] [train], epoch: 39/50, iter: 834/834, loss: 0.25961, lr: 0.146675, top1: 0.72886, throughput: 312.18 | 2022-04-03 12:16:27.137 [rank:4] [train], epoch: 39/50, iter: 834/834, loss: 0.26583, lr: 0.146675, top1: 0.71140, throughput: 311.72 | 2022-04-03 12:16:27.137 [rank:1] [train], epoch: 39/50, iter: 834/834, loss: 0.26200, lr: 0.146675, top1: 0.72564, throughput: 311.58 | 2022-04-03 12:16:27.138 [rank:6] [train], epoch: 39/50, iter: 834/834, loss: 0.26359, lr: 0.146675, top1: 0.72074, throughput: 312.84 | 2022-04-03 12:16:27.138 [rank:3] [train], epoch: 39/50, iter: 834/834, loss: 0.26228, lr: 0.146675, top1: 0.72549, throughput: 312.41 | 2022-04-03 12:16:27.150 [rank:5] [train], epoch: 39/50, iter: 834/834, loss: 0.26195, lr: 0.146675, top1: 0.73101, throughput: 311.78 | 2022-04-03 12:16:27.175 [rank:0] [train], epoch: 39/50, iter: 834/834, loss: 0.26669, lr: 0.146675, top1: 0.71369, throughput: 311.78 | 2022-04-03 12:16:27.176 [rank:0] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72944, throughput: 487.39 | 2022-04-03 12:16:40.000 [rank:1] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72800, throughput: 485.75 | 2022-04-03 12:16:40.004 [rank:2] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.71344, throughput: 485.56 | 2022-04-03 12:16:40.009 [rank:4] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72976, throughput: 485.20 | 2022-04-03 12:16:40.019 [rank:5] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.71696, throughput: 486.39 | 2022-04-03 12:16:40.025 [rank:7] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72880, throughput: 484.52 | 2022-04-03 12:16:40.031 [rank:3] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72288, throughput: 485.06 | 2022-04-03 12:16:40.035 [rank:6] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72736, throughput: 483.63 | 2022-04-03 12:16:40.061 [rank:6] [train], epoch: 40/50, iter: 100/834, loss: 0.25784, lr: 0.143292, top1: 0.73427, throughput: 313.98 | 2022-04-03 12:17:41.212 [rank:1] [train], epoch: 40/50, iter: 100/834, loss: 0.25721, lr: 0.143292, top1: 0.73333, throughput: 313.66 | 2022-04-03 12:17:41.217 [rank:2] [train], epoch: 40/50, iter: 100/834, loss: 0.25755, lr: 0.143292, top1: 0.73286, throughput: 313.65 | 2022-04-03 12:17:41.223 [rank:3] [train], epoch: 40/50, iter: 100/834, loss: 0.25640, lr: 0.143292, top1: 0.73677, throughput: 313.77 | 2022-04-03 12:17:41.225 [rank:5] [train], epoch: 40/50, iter: 100/834, loss: 0.25629, lr: 0.143292, top1: 0.73391, throughput: 313.71 | 2022-04-03 12:17:41.228 [rank:4] [train], epoch: 40/50, iter: 100/834, loss: 0.25835, lr: 0.143292, top1: 0.73000, throughput: 313.55 | 2022-04-03 12:17:41.253 [rank:7] [train], epoch: 40/50, iter: 100/834, loss: 0.25545, lr: 0.143292, top1: 0.73901, throughput: 313.60 | 2022-04-03 12:17:41.256 [rank:0] [train], epoch: 40/50, iter: 100/834, loss: 0.25418, lr: 0.143292, top1: 0.74354, throughput: 313.76 | 2022-04-03 12:17:41.192 [rank:1] [train], epoch: 40/50, iter: 200/834, loss: 0.25791, lr: 0.139944, top1: 0.73354, throughput: 311.56 | 2022-04-03 12:18:42.842 [rank:5] [train], epoch: 40/50, iter: 200/834, loss: 0.25848, lr: 0.139944, top1: 0.73068, throughput: 311.58 | 2022-04-03 12:18:42.849 [rank:6] [train], epoch: 40/50, iter: 200/834, loss: 0.25767, lr: 0.139944, top1: 0.73411, throughput: 311.49 | 2022-04-03 12:18:42.851 [rank:2] [train], epoch: 40/50, iter: 200/834, loss: 0.26143, lr: 0.139944, top1: 0.72729, throughput: 311.54 | 2022-04-03 12:18:42.852 [rank:4] [train], epoch: 40/50, iter: 200/834, loss: 0.25813, lr: 0.139944, top1: 0.73359, throughput: 311.65 | 2022-04-03 12:18:42.860 [rank:7] [train], epoch: 40/50, iter: 200/834, loss: 0.26086, lr: 0.139944, top1: 0.72667, throughput: 311.52 | 2022-04-03 12:18:42.889 [rank:3] [train], epoch: 40/50, iter: 200/834, loss: 0.25858, lr: 0.139944, top1: 0.72979, throughput: 311.34 | 2022-04-03 12:18:42.894 [rank:0] [train], epoch: 40/50, iter: 200/834, loss: 0.25877, lr: 0.139944, top1: 0.72943, throughput: 311.13 | 2022-04-03 12:18:42.903 [rank:2] [train], epoch: 40/50, iter: 300/834, loss: 0.25973, lr: 0.136632, top1: 0.73167, throughput: 314.78 | 2022-04-03 12:19:43.847 [rank:3] [train], epoch: 40/50, iter: 300/834, loss: 0.25766, lr: 0.136632, top1: 0.73312, throughput: 314.96 | 2022-04-03 12:19:43.854 [rank:7] [train], epoch: 40/50, iter: 300/834, loss: 0.26005, lr: 0.136632, top1: 0.73083, throughput: 314.89 | 2022-04-03 12:19:43.863 [rank:0] [train], epoch: 40/50, iter: 300/834, loss: 0.25892, lr: 0.136632, top1: 0.72734, throughput: 314.95 | 2022-04-03 12:19:43.864 [rank:6] [train], epoch: 40/50, iter: 300/834, loss: 0.25780, lr: 0.136632, top1: 0.72943, throughput: 314.66 | 2022-04-03 12:19:43.869 [rank:5] [train], epoch: 40/50, iter: 300/834, loss: 0.25878, lr: 0.136632, top1: 0.73276, throughput: 314.61 | 2022-04-03 12:19:43.876 [rank:1] [train], epoch: 40/50, iter: 300/834, loss: 0.25844, lr: 0.136632, top1: 0.73182, throughput: 314.86 | 2022-04-03 12:19:43.821 [rank:4] [train], epoch: 40/50, iter: 300/834, loss: 0.25931, lr: 0.136632, top1: 0.73083, throughput: 314.37 | 2022-04-03 12:19:43.934 [rank:3] [train], epoch: 40/50, iter: 400/834, loss: 0.25597, lr: 0.133356, top1: 0.73240, throughput: 314.11 | 2022-04-03 12:20:44.980 [rank:0] [train], epoch: 40/50, iter: 400/834, loss: 0.25742, lr: 0.133356, top1: 0.73234, throughput: 314.14 | 2022-04-03 12:20:44.983 [rank:1] [train], epoch: 40/50, iter: 400/834, loss: 0.25880, lr: 0.133356, top1: 0.72995, throughput: 313.91 | 2022-04-03 12:20:44.985 [rank:5] [train], epoch: 40/50, iter: 400/834, loss: 0.25870, lr: 0.133356, top1: 0.73417, throughput: 314.13 | 2022-04-03 12:20:44.996 [rank:2] [train], epoch: 40/50, iter: 400/834, loss: 0.26082, lr: 0.133356, top1: 0.72661, throughput: 313.85 | 2022-04-03 12:20:45.021 [rank:4] [train], epoch: 40/50, iter: 400/834, loss: 0.25810, lr: 0.133356, top1: 0.73198, throughput: 314.27 | 2022-04-03 12:20:45.028 [rank:6] [train], epoch: 40/50, iter: 400/834, loss: 0.25868, lr: 0.133356, top1: 0.73078, throughput: 313.93 | 2022-04-03 12:20:45.029 [rank:7] [train], epoch: 40/50, iter: 400/834, loss: 0.25730, lr: 0.133356, top1: 0.73479, throughput: 313.84 | 2022-04-03 12:20:45.041 [rank:1] [train], epoch: 40/50, iter: 500/834, loss: 0.25884, lr: 0.130115, top1: 0.73000, throughput: 313.40 | 2022-04-03 12:21:46.248 [rank:5] [train], epoch: 40/50, iter: 500/834, loss: 0.25827, lr: 0.130115, top1: 0.73036, throughput: 313.41 | 2022-04-03 12:21:46.258 [rank:3] [train], epoch: 40/50, iter: 500/834, loss: 0.25834, lr: 0.130115, top1: 0.73359, throughput: 313.25 | 2022-04-03 12:21:46.273 [rank:6] [train], epoch: 40/50, iter: 500/834, loss: 0.25928, lr: 0.130115, top1: 0.72906, throughput: 313.37 | 2022-04-03 12:21:46.297 [rank:2] [train], epoch: 40/50, iter: 500/834, loss: 0.26068, lr: 0.130115, top1: 0.72505, throughput: 313.25 | 2022-04-03 12:21:46.313 [rank:0] [train], epoch: 40/50, iter: 500/834, loss: 0.25779, lr: 0.130115, top1: 0.73427, throughput: 313.00 | 2022-04-03 12:21:46.326 [rank:7] [train], epoch: 40/50, iter: 500/834, loss: 0.25869, lr: 0.130115, top1: 0.73120, throughput: 313.24 | 2022-04-03 12:21:46.336 [rank:4] [train], epoch: 40/50, iter: 500/834, loss: 0.26042, lr: 0.130115, top1: 0.72771, throughput: 313.11 | 2022-04-03 12:21:46.349 [rank:6] [train], epoch: 40/50, iter: 600/834, loss: 0.25970, lr: 0.126911, top1: 0.72839, throughput: 310.81 | 2022-04-03 12:22:48.071 [rank:4] [train], epoch: 40/50, iter: 600/834, loss: 0.26020, lr: 0.126911, top1: 0.72880, throughput: 310.98 | 2022-04-03 12:22:48.089 [rank:1] [train], epoch: 40/50, iter: 600/834, loss: 0.25887, lr: 0.126911, top1: 0.73068, throughput: 310.45 | 2022-04-03 12:22:48.095 [rank:2] [train], epoch: 40/50, iter: 600/834, loss: 0.26117, lr: 0.126911, top1: 0.72755, throughput: 310.71 | 2022-04-03 12:22:48.107 [rank:0] [train], epoch: 40/50, iter: 600/834, loss: 0.26032, lr: 0.126911, top1: 0.72734, throughput: 310.71 | 2022-04-03 12:22:48.121 [rank:7] [train], epoch: 40/50, iter: 600/834, loss: 0.26117, lr: 0.126911, top1: 0.72620, throughput: 310.72 | 2022-04-03 12:22:48.128 [rank:5] [train], epoch: 40/50, iter: 600/834, loss: 0.25758, lr: 0.126911, top1: 0.73177, throughput: 310.32 | 2022-04-03 12:22:48.131 [rank:3] [train], epoch: 40/50, iter: 600/834, loss: 0.25894, lr: 0.126911, top1: 0.73130, throughput: 310.31 | 2022-04-03 12:22:48.146 [rank:5] [train], epoch: 40/50, iter: 700/834, loss: 0.25704, lr: 0.123743, top1: 0.73760, throughput: 313.27 | 2022-04-03 12:23:49.419 [rank:6] [train], epoch: 40/50, iter: 700/834, loss: 0.25712, lr: 0.123743, top1: 0.73646, throughput: 312.79 | 2022-04-03 12:23:49.455 [rank:7] [train], epoch: 40/50, iter: 700/834, loss: 0.25861, lr: 0.123743, top1: 0.72870, throughput: 313.06 | 2022-04-03 12:23:49.460 [rank:1] [train], epoch: 40/50, iter: 700/834, loss: 0.26036, lr: 0.123743, top1: 0.73052, throughput: 312.87 | 2022-04-03 12:23:49.462 [rank:3] [train], epoch: 40/50, iter: 700/834, loss: 0.25947, lr: 0.123743, top1: 0.73146, throughput: 312.96 | 2022-04-03 12:23:49.496 [rank:4] [train], epoch: 40/50, iter: 700/834, loss: 0.25895, lr: 0.123743, top1: 0.73099, throughput: 312.65 | 2022-04-03 12:23:49.500 [rank:2] [train], epoch: 40/50, iter: 700/834, loss: 0.25877, lr: 0.123743, top1: 0.72927, throughput: 312.73 | 2022-04-03 12:23:49.501 [rank:0] [train], epoch: 40/50, iter: 700/834, loss: 0.25679, lr: 0.123743, top1: 0.73448, throughput: 312.73 | 2022-04-03 12:23:49.515 [rank:6] [train], epoch: 40/50, iter: 800/834, loss: 0.25819, lr: 0.120612, top1: 0.73229, throughput: 311.98 | 2022-04-03 12:24:50.998 [rank:3] [train], epoch: 40/50, iter: 800/834, loss: 0.25673, lr: 0.120612, top1: 0.73490, throughput: 312.14 | 2022-04-03 12:24:51.008 [rank:5] [train], epoch: 40/50, iter: 800/834, loss: 0.25875, lr: 0.120612, top1: 0.72979, throughput: 311.73 | 2022-04-03 12:24:51.011 [rank:2] [train], epoch: 40/50, iter: 800/834, loss: 0.25771, lr: 0.120612, top1: 0.73286, throughput: 312.04 | 2022-04-03 12:24:51.033 [rank:1] [train], epoch: 40/50, iter: 800/834, loss: 0.25824, lr: 0.120612, top1: 0.73328, throughput: 311.81 | 2022-04-03 12:24:51.038 [rank:4] [train], epoch: 40/50, iter: 800/834, loss: 0.25734, lr: 0.120612, top1: 0.73474, throughput: 312.28 | 2022-04-03 12:24:50.983 [rank:0] [train], epoch: 40/50, iter: 800/834, loss: 0.25782, lr: 0.120612, top1: 0.73141, throughput: 311.89 | 2022-04-03 12:24:51.075 [rank:7] [train], epoch: 40/50, iter: 800/834, loss: 0.25778, lr: 0.120612, top1: 0.73083, throughput: 312.05 | 2022-04-03 12:24:50.988 [rank:6] [train], epoch: 40/50, iter: 834/834, loss: 0.25874, lr: 0.119556, top1: 0.72855, throughput: 314.32 | 2022-04-03 12:25:11.767 [rank:2] [train], epoch: 40/50, iter: 834/834, loss: 0.26055, lr: 0.119556, top1: 0.72304, throughput: 314.82 | 2022-04-03 12:25:11.768 [rank:1] [train], epoch: 40/50, iter: 834/834, loss: 0.25584, lr: 0.119556, top1: 0.74096, throughput: 314.90 | 2022-04-03 12:25:11.769 [rank:7] [train], epoch: 40/50, iter: 834/834, loss: 0.25786, lr: 0.119556, top1: 0.73422, throughput: 314.13 | 2022-04-03 12:25:11.769 [rank:5] [train], epoch: 40/50, iter: 834/834, loss: 0.25776, lr: 0.119556, top1: 0.73208, throughput: 314.37 | 2022-04-03 12:25:11.776 [rank:4] [train], epoch: 40/50, iter: 834/834, loss: 0.26274, lr: 0.119556, top1: 0.72197, throughput: 313.71 | 2022-04-03 12:25:11.792 [rank:3] [train], epoch: 40/50, iter: 834/834, loss: 0.25573, lr: 0.119556, top1: 0.73085, throughput: 313.77 | 2022-04-03 12:25:11.813 [rank:0] [train], epoch: 40/50, iter: 834/834, loss: 0.25427, lr: 0.119556, top1: 0.73606, throughput: 314.78 | 2022-04-03 12:25:11.813 [rank:0] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73536, throughput: 489.78 | 2022-04-03 12:25:24.574 [rank:1] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73504, throughput: 487.96 | 2022-04-03 12:25:24.577 [rank:2] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.72672, throughput: 487.48 | 2022-04-03 12:25:24.589 [rank:5] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.72288, throughput: 487.46 | 2022-04-03 12:25:24.598 [rank:4] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73264, throughput: 488.06 | 2022-04-03 12:25:24.598 [rank:7] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73920, throughput: 487.15 | 2022-04-03 12:25:24.599 [rank:3] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.72576, throughput: 488.23 | 2022-04-03 12:25:24.614 [rank:6] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73776, throughput: 485.94 | 2022-04-03 12:25:24.628 [rank:6] [train], epoch: 41/50, iter: 100/834, loss: 0.25562, lr: 0.116474, top1: 0.73542, throughput: 313.70 | 2022-04-03 12:26:25.834 [rank:2] [train], epoch: 41/50, iter: 100/834, loss: 0.25246, lr: 0.116474, top1: 0.74844, throughput: 313.49 | 2022-04-03 12:26:25.835 [rank:1] [train], epoch: 41/50, iter: 100/834, loss: 0.25600, lr: 0.116474, top1: 0.73818, throughput: 313.38 | 2022-04-03 12:26:25.844 [rank:7] [train], epoch: 41/50, iter: 100/834, loss: 0.25421, lr: 0.116474, top1: 0.74047, throughput: 313.45 | 2022-04-03 12:26:25.853 [rank:5] [train], epoch: 41/50, iter: 100/834, loss: 0.25447, lr: 0.116474, top1: 0.74182, throughput: 313.42 | 2022-04-03 12:26:25.857 [rank:4] [train], epoch: 41/50, iter: 100/834, loss: 0.25135, lr: 0.116474, top1: 0.74807, throughput: 313.36 | 2022-04-03 12:26:25.869 [rank:3] [train], epoch: 41/50, iter: 100/834, loss: 0.25210, lr: 0.116474, top1: 0.74578, throughput: 313.38 | 2022-04-03 12:26:25.881 [rank:0] [train], epoch: 41/50, iter: 100/834, loss: 0.25539, lr: 0.116474, top1: 0.73760, throughput: 313.16 | 2022-04-03 12:26:25.884 [rank:6] [train], epoch: 41/50, iter: 200/834, loss: 0.25052, lr: 0.113429, top1: 0.75182, throughput: 311.85 | 2022-04-03 12:27:27.402 [rank:5] [train], epoch: 41/50, iter: 200/834, loss: 0.25555, lr: 0.113429, top1: 0.73547, throughput: 311.65 | 2022-04-03 12:27:27.465 [rank:0] [train], epoch: 41/50, iter: 200/834, loss: 0.25441, lr: 0.113429, top1: 0.73807, throughput: 311.75 | 2022-04-03 12:27:27.473 [rank:1] [train], epoch: 41/50, iter: 200/834, loss: 0.25443, lr: 0.113429, top1: 0.73932, throughput: 311.53 | 2022-04-03 12:27:27.475 [rank:7] [train], epoch: 41/50, iter: 200/834, loss: 0.25456, lr: 0.113429, top1: 0.74026, throughput: 311.55 | 2022-04-03 12:27:27.481 [rank:2] [train], epoch: 41/50, iter: 200/834, loss: 0.25423, lr: 0.113429, top1: 0.74302, throughput: 311.46 | 2022-04-03 12:27:27.481 [rank:3] [train], epoch: 41/50, iter: 200/834, loss: 0.25339, lr: 0.113429, top1: 0.74526, throughput: 311.59 | 2022-04-03 12:27:27.500 [rank:4] [train], epoch: 41/50, iter: 200/834, loss: 0.25241, lr: 0.113429, top1: 0.74724, throughput: 311.42 | 2022-04-03 12:27:27.522 [rank:4] [train], epoch: 41/50, iter: 300/834, loss: 0.25534, lr: 0.110422, top1: 0.73776, throughput: 313.22 | 2022-04-03 12:28:28.821 [rank:6] [train], epoch: 41/50, iter: 300/834, loss: 0.25383, lr: 0.110422, top1: 0.74000, throughput: 312.48 | 2022-04-03 12:28:28.846 [rank:1] [train], epoch: 41/50, iter: 300/834, loss: 0.25487, lr: 0.110422, top1: 0.73828, throughput: 312.83 | 2022-04-03 12:28:28.850 [rank:7] [train], epoch: 41/50, iter: 300/834, loss: 0.25577, lr: 0.110422, top1: 0.73901, throughput: 312.83 | 2022-04-03 12:28:28.857 [rank:3] [train], epoch: 41/50, iter: 300/834, loss: 0.25123, lr: 0.110422, top1: 0.74479, throughput: 312.88 | 2022-04-03 12:28:28.866 [rank:0] [train], epoch: 41/50, iter: 300/834, loss: 0.25327, lr: 0.110422, top1: 0.74365, throughput: 312.65 | 2022-04-03 12:28:28.884 [rank:2] [train], epoch: 41/50, iter: 300/834, loss: 0.25392, lr: 0.110422, top1: 0.74417, throughput: 313.02 | 2022-04-03 12:28:28.818 [rank:5] [train], epoch: 41/50, iter: 300/834, loss: 0.25608, lr: 0.110422, top1: 0.73906, throughput: 312.87 | 2022-04-03 12:28:28.832 [rank:7] [train], epoch: 41/50, iter: 400/834, loss: 0.25244, lr: 0.107451, top1: 0.74375, throughput: 313.31 | 2022-04-03 12:29:30.137 [rank:2] [train], epoch: 41/50, iter: 400/834, loss: 0.25509, lr: 0.107451, top1: 0.73927, throughput: 313.06 | 2022-04-03 12:29:30.148 [rank:6] [train], epoch: 41/50, iter: 400/834, loss: 0.25603, lr: 0.107451, top1: 0.73323, throughput: 313.20 | 2022-04-03 12:29:30.149 [rank:1] [train], epoch: 41/50, iter: 400/834, loss: 0.25406, lr: 0.107451, top1: 0.74172, throughput: 313.17 | 2022-04-03 12:29:30.158 [rank:3] [train], epoch: 41/50, iter: 400/834, loss: 0.25408, lr: 0.107451, top1: 0.74370, throughput: 313.01 | 2022-04-03 12:29:30.205 [rank:4] [train], epoch: 41/50, iter: 400/834, loss: 0.25261, lr: 0.107451, top1: 0.74365, throughput: 312.73 | 2022-04-03 12:29:30.217 [rank:0] [train], epoch: 41/50, iter: 400/834, loss: 0.25269, lr: 0.107451, top1: 0.74208, throughput: 313.00 | 2022-04-03 12:29:30.226 [rank:5] [train], epoch: 41/50, iter: 400/834, loss: 0.25362, lr: 0.107451, top1: 0.74307, throughput: 312.59 | 2022-04-03 12:29:30.255 [rank:4] [train], epoch: 41/50, iter: 500/834, loss: 0.25436, lr: 0.104518, top1: 0.74193, throughput: 313.13 | 2022-04-03 12:30:31.533 [rank:5] [train], epoch: 41/50, iter: 500/834, loss: 0.25577, lr: 0.104518, top1: 0.73781, throughput: 313.26 | 2022-04-03 12:30:31.546 [rank:7] [train], epoch: 41/50, iter: 500/834, loss: 0.25521, lr: 0.104518, top1: 0.73812, throughput: 312.61 | 2022-04-03 12:30:31.555 [rank:3] [train], epoch: 41/50, iter: 500/834, loss: 0.25529, lr: 0.104518, top1: 0.73891, throughput: 312.91 | 2022-04-03 12:30:31.564 [rank:1] [train], epoch: 41/50, iter: 500/834, loss: 0.25658, lr: 0.104518, top1: 0.73672, throughput: 312.59 | 2022-04-03 12:30:31.580 [rank:2] [train], epoch: 41/50, iter: 500/834, loss: 0.25583, lr: 0.104518, top1: 0.73964, throughput: 312.53 | 2022-04-03 12:30:31.581 [rank:6] [train], epoch: 41/50, iter: 500/834, loss: 0.25334, lr: 0.104518, top1: 0.74234, throughput: 312.45 | 2022-04-03 12:30:31.600 [rank:0] [train], epoch: 41/50, iter: 500/834, loss: 0.25449, lr: 0.104518, top1: 0.73990, throughput: 313.22 | 2022-04-03 12:30:31.525 [rank:7] [train], epoch: 41/50, iter: 600/834, loss: 0.25594, lr: 0.101623, top1: 0.74167, throughput: 311.64 | 2022-04-03 12:31:33.165 [rank:6] [train], epoch: 41/50, iter: 600/834, loss: 0.25371, lr: 0.101623, top1: 0.74005, throughput: 311.84 | 2022-04-03 12:31:33.170 [rank:1] [train], epoch: 41/50, iter: 600/834, loss: 0.25467, lr: 0.101623, top1: 0.73885, throughput: 311.67 | 2022-04-03 12:31:33.184 [rank:3] [train], epoch: 41/50, iter: 600/834, loss: 0.25508, lr: 0.101623, top1: 0.74328, throughput: 311.51 | 2022-04-03 12:31:33.200 [rank:5] [train], epoch: 41/50, iter: 600/834, loss: 0.25497, lr: 0.101623, top1: 0.73792, throughput: 311.33 | 2022-04-03 12:31:33.218 [rank:0] [train], epoch: 41/50, iter: 600/834, loss: 0.25607, lr: 0.101623, top1: 0.73552, throughput: 311.20 | 2022-04-03 12:31:33.222 [rank:2] [train], epoch: 41/50, iter: 600/834, loss: 0.25115, lr: 0.101623, top1: 0.74745, throughput: 311.40 | 2022-04-03 12:31:33.239 [rank:4] [train], epoch: 41/50, iter: 600/834, loss: 0.25431, lr: 0.101623, top1: 0.73563, throughput: 311.13 | 2022-04-03 12:31:33.243 [rank:1] [train], epoch: 41/50, iter: 700/834, loss: 0.25481, lr: 0.098766, top1: 0.73839, throughput: 313.15 | 2022-04-03 12:32:34.497 [rank:0] [train], epoch: 41/50, iter: 700/834, loss: 0.25339, lr: 0.098766, top1: 0.74443, throughput: 313.27 | 2022-04-03 12:32:34.511 [rank:3] [train], epoch: 41/50, iter: 700/834, loss: 0.25321, lr: 0.098766, top1: 0.74203, throughput: 313.15 | 2022-04-03 12:32:34.512 [rank:6] [train], epoch: 41/50, iter: 700/834, loss: 0.25424, lr: 0.098766, top1: 0.74151, throughput: 312.84 | 2022-04-03 12:32:34.544 [rank:5] [train], epoch: 41/50, iter: 700/834, loss: 0.25134, lr: 0.098766, top1: 0.74302, throughput: 313.06 | 2022-04-03 12:32:34.548 [rank:2] [train], epoch: 41/50, iter: 700/834, loss: 0.25318, lr: 0.098766, top1: 0.74370, throughput: 313.15 | 2022-04-03 12:32:34.552 [rank:4] [train], epoch: 41/50, iter: 700/834, loss: 0.25252, lr: 0.098766, top1: 0.74365, throughput: 313.09 | 2022-04-03 12:32:34.567 [rank:7] [train], epoch: 41/50, iter: 700/834, loss: 0.25380, lr: 0.098766, top1: 0.74193, throughput: 313.13 | 2022-04-03 12:32:34.481 [rank:2] [train], epoch: 41/50, iter: 800/834, loss: 0.25477, lr: 0.095946, top1: 0.74068, throughput: 313.42 | 2022-04-03 12:33:35.811 [rank:6] [train], epoch: 41/50, iter: 800/834, loss: 0.25382, lr: 0.095946, top1: 0.74156, throughput: 313.29 | 2022-04-03 12:33:35.828 [rank:1] [train], epoch: 41/50, iter: 800/834, loss: 0.25687, lr: 0.095946, top1: 0.73453, throughput: 312.98 | 2022-04-03 12:33:35.842 [rank:3] [train], epoch: 41/50, iter: 800/834, loss: 0.25524, lr: 0.095946, top1: 0.73734, throughput: 312.84 | 2022-04-03 12:33:35.886 [rank:7] [train], epoch: 41/50, iter: 800/834, loss: 0.25477, lr: 0.095946, top1: 0.73594, throughput: 312.64 | 2022-04-03 12:33:35.893 [rank:5] [train], epoch: 41/50, iter: 800/834, loss: 0.25455, lr: 0.095946, top1: 0.74208, throughput: 312.96 | 2022-04-03 12:33:35.897 [rank:4] [train], epoch: 41/50, iter: 800/834, loss: 0.25143, lr: 0.095946, top1: 0.74240, throughput: 313.01 | 2022-04-03 12:33:35.907 [rank:0] [train], epoch: 41/50, iter: 800/834, loss: 0.25293, lr: 0.095946, top1: 0.74318, throughput: 312.53 | 2022-04-03 12:33:35.945 [rank:0] [train], epoch: 41/50, iter: 834/834, loss: 0.25664, lr: 0.094996, top1: 0.73820, throughput: 313.19 | 2022-04-03 12:33:56.788 [rank:5] [train], epoch: 41/50, iter: 834/834, loss: 0.25670, lr: 0.094996, top1: 0.73254, throughput: 312.47 | 2022-04-03 12:33:56.789 [rank:6] [train], epoch: 41/50, iter: 834/834, loss: 0.25400, lr: 0.094996, top1: 0.73591, throughput: 311.36 | 2022-04-03 12:33:56.794 [rank:1] [train], epoch: 41/50, iter: 834/834, loss: 0.25361, lr: 0.094996, top1: 0.74295, throughput: 311.54 | 2022-04-03 12:33:56.796 [rank:3] [train], epoch: 41/50, iter: 834/834, loss: 0.25527, lr: 0.094996, top1: 0.73223, throughput: 312.19 | 2022-04-03 12:33:56.796 [rank:2] [train], epoch: 41/50, iter: 834/834, loss: 0.25484, lr: 0.094996, top1: 0.73330, throughput: 311.04 | 2022-04-03 12:33:56.799 [rank:4] [train], epoch: 41/50, iter: 834/834, loss: 0.25135, lr: 0.094996, top1: 0.74020, throughput: 312.45 | 2022-04-03 12:33:56.800 [rank:7] [train], epoch: 41/50, iter: 834/834, loss: 0.25756, lr: 0.094996, top1: 0.73606, throughput: 312.17 | 2022-04-03 12:33:56.804 [rank:0] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.75152, throughput: 488.59 | 2022-04-03 12:34:09.580 [rank:2] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.73232, throughput: 488.66 | 2022-04-03 12:34:09.589 [rank:1] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.74224, throughput: 488.53 | 2022-04-03 12:34:09.589 [rank:4] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.74032, throughput: 488.21 | 2022-04-03 12:34:09.602 [rank:5] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.73232, throughput: 487.70 | 2022-04-03 12:34:09.604 [rank:3] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.73552, throughput: 487.87 | 2022-04-03 12:34:09.607 [rank:7] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.74624, throughput: 488.14 | 2022-04-03 12:34:09.608 [rank:6] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.74512, throughput: 486.31 | 2022-04-03 12:34:09.646 [rank:5] [train], epoch: 42/50, iter: 100/834, loss: 0.24910, lr: 0.092228, top1: 0.75063, throughput: 313.52 | 2022-04-03 12:35:10.843 [rank:3] [train], epoch: 42/50, iter: 100/834, loss: 0.24939, lr: 0.092228, top1: 0.75141, throughput: 313.49 | 2022-04-03 12:35:10.853 [rank:1] [train], epoch: 42/50, iter: 100/834, loss: 0.25037, lr: 0.092228, top1: 0.74932, throughput: 313.39 | 2022-04-03 12:35:10.855 [rank:4] [train], epoch: 42/50, iter: 100/834, loss: 0.25041, lr: 0.092228, top1: 0.74813, throughput: 313.37 | 2022-04-03 12:35:10.871 [rank:2] [train], epoch: 42/50, iter: 100/834, loss: 0.24837, lr: 0.092228, top1: 0.75391, throughput: 313.28 | 2022-04-03 12:35:10.876 [rank:7] [train], epoch: 42/50, iter: 100/834, loss: 0.24915, lr: 0.092228, top1: 0.75094, throughput: 313.28 | 2022-04-03 12:35:10.895 [rank:0] [train], epoch: 42/50, iter: 100/834, loss: 0.25110, lr: 0.092228, top1: 0.74911, throughput: 313.13 | 2022-04-03 12:35:10.896 [rank:6] [train], epoch: 42/50, iter: 100/834, loss: 0.25038, lr: 0.092228, top1: 0.74776, throughput: 313.30 | 2022-04-03 12:35:10.929 [rank:2] [train], epoch: 42/50, iter: 200/834, loss: 0.24870, lr: 0.089498, top1: 0.75385, throughput: 312.30 | 2022-04-03 12:36:12.355 [rank:3] [train], epoch: 42/50, iter: 200/834, loss: 0.25065, lr: 0.089498, top1: 0.74974, throughput: 312.00 | 2022-04-03 12:36:12.391 [rank:1] [train], epoch: 42/50, iter: 200/834, loss: 0.25236, lr: 0.089498, top1: 0.74312, throughput: 311.99 | 2022-04-03 12:36:12.395 [rank:7] [train], epoch: 42/50, iter: 200/834, loss: 0.24824, lr: 0.089498, top1: 0.75167, throughput: 312.15 | 2022-04-03 12:36:12.405 [rank:5] [train], epoch: 42/50, iter: 200/834, loss: 0.25017, lr: 0.089498, top1: 0.74953, throughput: 311.86 | 2022-04-03 12:36:12.410 [rank:6] [train], epoch: 42/50, iter: 200/834, loss: 0.25049, lr: 0.089498, top1: 0.74604, throughput: 312.11 | 2022-04-03 12:36:12.446 [rank:4] [train], epoch: 42/50, iter: 200/834, loss: 0.24992, lr: 0.089498, top1: 0.74948, throughput: 312.26 | 2022-04-03 12:36:12.357 [rank:0] [train], epoch: 42/50, iter: 200/834, loss: 0.24920, lr: 0.089498, top1: 0.75182, throughput: 311.59 | 2022-04-03 12:36:12.514 [rank:0] [train], epoch: 42/50, iter: 300/834, loss: 0.25263, lr: 0.086807, top1: 0.74271, throughput: 313.25 | 2022-04-03 12:37:13.808 [rank:3] [train], epoch: 42/50, iter: 300/834, loss: 0.25248, lr: 0.086807, top1: 0.74594, throughput: 312.55 | 2022-04-03 12:37:13.821 [rank:5] [train], epoch: 42/50, iter: 300/834, loss: 0.25019, lr: 0.086807, top1: 0.74766, throughput: 312.57 | 2022-04-03 12:37:13.836 [rank:1] [train], epoch: 42/50, iter: 300/834, loss: 0.25135, lr: 0.086807, top1: 0.74427, throughput: 312.26 | 2022-04-03 12:37:13.881 [rank:7] [train], epoch: 42/50, iter: 300/834, loss: 0.24810, lr: 0.086807, top1: 0.75276, throughput: 312.24 | 2022-04-03 12:37:13.895 [rank:4] [train], epoch: 42/50, iter: 300/834, loss: 0.24719, lr: 0.086807, top1: 0.75448, throughput: 312.00 | 2022-04-03 12:37:13.896 [rank:6] [train], epoch: 42/50, iter: 300/834, loss: 0.24766, lr: 0.086807, top1: 0.75344, throughput: 312.39 | 2022-04-03 12:37:13.907 [rank:2] [train], epoch: 42/50, iter: 300/834, loss: 0.24984, lr: 0.086807, top1: 0.75120, throughput: 311.88 | 2022-04-03 12:37:13.918 [rank:7] [train], epoch: 42/50, iter: 400/834, loss: 0.25145, lr: 0.084154, top1: 0.74583, throughput: 311.06 | 2022-04-03 12:38:15.620 [rank:1] [train], epoch: 42/50, iter: 400/834, loss: 0.24830, lr: 0.084154, top1: 0.75495, throughput: 310.98 | 2022-04-03 12:38:15.622 [rank:2] [train], epoch: 42/50, iter: 400/834, loss: 0.24763, lr: 0.084154, top1: 0.75286, throughput: 311.14 | 2022-04-03 12:38:15.626 [rank:6] [train], epoch: 42/50, iter: 400/834, loss: 0.25044, lr: 0.084154, top1: 0.74599, throughput: 311.07 | 2022-04-03 12:38:15.629 [rank:4] [train], epoch: 42/50, iter: 400/834, loss: 0.24953, lr: 0.084154, top1: 0.74885, throughput: 310.91 | 2022-04-03 12:38:15.651 [rank:3] [train], epoch: 42/50, iter: 400/834, loss: 0.24919, lr: 0.084154, top1: 0.74979, throughput: 310.46 | 2022-04-03 12:38:15.666 [rank:0] [train], epoch: 42/50, iter: 400/834, loss: 0.25221, lr: 0.084154, top1: 0.74755, throughput: 310.36 | 2022-04-03 12:38:15.672 [rank:5] [train], epoch: 42/50, iter: 400/834, loss: 0.24839, lr: 0.084154, top1: 0.75208, throughput: 310.87 | 2022-04-03 12:38:15.599 [rank:3] [train], epoch: 42/50, iter: 500/834, loss: 0.24853, lr: 0.081540, top1: 0.75120, throughput: 314.50 | 2022-04-03 12:39:16.714 [rank:7] [train], epoch: 42/50, iter: 500/834, loss: 0.25068, lr: 0.081540, top1: 0.74667, throughput: 314.25 | 2022-04-03 12:39:16.719 [rank:6] [train], epoch: 42/50, iter: 500/834, loss: 0.25015, lr: 0.081540, top1: 0.74630, throughput: 314.17 | 2022-04-03 12:39:16.743 [rank:2] [train], epoch: 42/50, iter: 500/834, loss: 0.24992, lr: 0.081540, top1: 0.75109, throughput: 314.15 | 2022-04-03 12:39:16.743 [rank:1] [train], epoch: 42/50, iter: 500/834, loss: 0.25076, lr: 0.081540, top1: 0.74885, throughput: 314.12 | 2022-04-03 12:39:16.744 [rank:5] [train], epoch: 42/50, iter: 500/834, loss: 0.24792, lr: 0.081540, top1: 0.75234, throughput: 313.94 | 2022-04-03 12:39:16.757 [rank:0] [train], epoch: 42/50, iter: 500/834, loss: 0.24778, lr: 0.081540, top1: 0.75490, throughput: 314.20 | 2022-04-03 12:39:16.779 [rank:4] [train], epoch: 42/50, iter: 500/834, loss: 0.24821, lr: 0.081540, top1: 0.75245, throughput: 314.51 | 2022-04-03 12:39:16.699 [rank:3] [train], epoch: 42/50, iter: 600/834, loss: 0.25082, lr: 0.078965, top1: 0.74578, throughput: 314.30 | 2022-04-03 12:40:17.802 [rank:1] [train], epoch: 42/50, iter: 600/834, loss: 0.25307, lr: 0.078965, top1: 0.74312, throughput: 314.46 | 2022-04-03 12:40:17.802 [rank:2] [train], epoch: 42/50, iter: 600/834, loss: 0.25121, lr: 0.078965, top1: 0.74974, throughput: 314.26 | 2022-04-03 12:40:17.840 [rank:0] [train], epoch: 42/50, iter: 600/834, loss: 0.24822, lr: 0.078965, top1: 0.75297, throughput: 314.40 | 2022-04-03 12:40:17.848 [rank:5] [train], epoch: 42/50, iter: 600/834, loss: 0.25128, lr: 0.078965, top1: 0.74776, throughput: 314.28 | 2022-04-03 12:40:17.849 [rank:6] [train], epoch: 42/50, iter: 600/834, loss: 0.24882, lr: 0.078965, top1: 0.75198, throughput: 314.18 | 2022-04-03 12:40:17.853 [rank:7] [train], epoch: 42/50, iter: 600/834, loss: 0.24858, lr: 0.078965, top1: 0.75187, throughput: 314.02 | 2022-04-03 12:40:17.861 [rank:4] [train], epoch: 42/50, iter: 600/834, loss: 0.24854, lr: 0.078965, top1: 0.75313, throughput: 314.31 | 2022-04-03 12:40:17.785 [rank:2] [train], epoch: 42/50, iter: 700/834, loss: 0.25193, lr: 0.076429, top1: 0.74885, throughput: 311.90 | 2022-04-03 12:41:19.398 [rank:3] [train], epoch: 42/50, iter: 700/834, loss: 0.25024, lr: 0.076429, top1: 0.74740, throughput: 311.60 | 2022-04-03 12:41:19.419 [rank:4] [train], epoch: 42/50, iter: 700/834, loss: 0.25079, lr: 0.076429, top1: 0.74776, throughput: 311.47 | 2022-04-03 12:41:19.428 [rank:6] [train], epoch: 42/50, iter: 700/834, loss: 0.25089, lr: 0.076429, top1: 0.74620, throughput: 311.77 | 2022-04-03 12:41:19.436 [rank:1] [train], epoch: 42/50, iter: 700/834, loss: 0.25221, lr: 0.076429, top1: 0.74646, throughput: 311.49 | 2022-04-03 12:41:19.442 [rank:5] [train], epoch: 42/50, iter: 700/834, loss: 0.24858, lr: 0.076429, top1: 0.75234, throughput: 311.68 | 2022-04-03 12:41:19.450 [rank:0] [train], epoch: 42/50, iter: 700/834, loss: 0.24923, lr: 0.076429, top1: 0.74953, throughput: 311.56 | 2022-04-03 12:41:19.474 [rank:7] [train], epoch: 42/50, iter: 700/834, loss: 0.24737, lr: 0.076429, top1: 0.75656, throughput: 312.04 | 2022-04-03 12:41:19.392 [rank:7] [train], epoch: 42/50, iter: 800/834, loss: 0.24839, lr: 0.073933, top1: 0.75302, throughput: 313.48 | 2022-04-03 12:42:20.639 [rank:1] [train], epoch: 42/50, iter: 800/834, loss: 0.24898, lr: 0.073933, top1: 0.75052, throughput: 313.59 | 2022-04-03 12:42:20.668 [rank:5] [train], epoch: 42/50, iter: 800/834, loss: 0.24915, lr: 0.073933, top1: 0.75073, throughput: 313.63 | 2022-04-03 12:42:20.669 [rank:2] [train], epoch: 42/50, iter: 800/834, loss: 0.24981, lr: 0.073933, top1: 0.75104, throughput: 313.20 | 2022-04-03 12:42:20.700 [rank:3] [train], epoch: 42/50, iter: 800/834, loss: 0.25106, lr: 0.073933, top1: 0.74750, throughput: 313.31 | 2022-04-03 12:42:20.700 [rank:4] [train], epoch: 42/50, iter: 800/834, loss: 0.25075, lr: 0.073933, top1: 0.74750, throughput: 313.32 | 2022-04-03 12:42:20.708 [rank:6] [train], epoch: 42/50, iter: 800/834, loss: 0.24978, lr: 0.073933, top1: 0.75047, throughput: 313.36 | 2022-04-03 12:42:20.708 [rank:0] [train], epoch: 42/50, iter: 800/834, loss: 0.25038, lr: 0.073933, top1: 0.74719, throughput: 313.47 | 2022-04-03 12:42:20.723 [rank:1] [train], epoch: 42/50, iter: 834/834, loss: 0.24792, lr: 0.073093, top1: 0.74893, throughput: 310.44 | 2022-04-03 12:42:41.696 [rank:2] [train], epoch: 42/50, iter: 834/834, loss: 0.24995, lr: 0.073093, top1: 0.74663, throughput: 310.85 | 2022-04-03 12:42:41.700 [rank:6] [train], epoch: 42/50, iter: 834/834, loss: 0.24769, lr: 0.073093, top1: 0.75337, throughput: 310.97 | 2022-04-03 12:42:41.700 [rank:0] [train], epoch: 42/50, iter: 834/834, loss: 0.25454, lr: 0.073093, top1: 0.73499, throughput: 311.10 | 2022-04-03 12:42:41.707 [rank:4] [train], epoch: 42/50, iter: 834/834, loss: 0.24990, lr: 0.073093, top1: 0.74923, throughput: 310.82 | 2022-04-03 12:42:41.710 [rank:3] [train], epoch: 42/50, iter: 834/834, loss: 0.24720, lr: 0.073093, top1: 0.75766, throughput: 310.72 | 2022-04-03 12:42:41.709 [rank:5] [train], epoch: 42/50, iter: 834/834, loss: 0.24889, lr: 0.073093, top1: 0.74678, throughput: 310.12 | 2022-04-03 12:42:41.719 [rank:7] [train], epoch: 42/50, iter: 834/834, loss: 0.24757, lr: 0.073093, top1: 0.75628, throughput: 309.23 | 2022-04-03 12:42:41.750 [rank:0] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74336, throughput: 489.92 | 2022-04-03 12:42:54.464 [rank:1] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.75120, throughput: 489.21 | 2022-04-03 12:42:54.472 [rank:2] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.73840, throughput: 489.23 | 2022-04-03 12:42:54.475 [rank:3] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74416, throughput: 489.41 | 2022-04-03 12:42:54.480 [rank:4] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74384, throughput: 489.31 | 2022-04-03 12:42:54.483 [rank:7] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.75024, throughput: 490.49 | 2022-04-03 12:42:54.492 [rank:5] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.73584, throughput: 488.84 | 2022-04-03 12:42:54.504 [rank:6] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74720, throughput: 487.95 | 2022-04-03 12:42:54.509 [rank:6] [train], epoch: 43/50, iter: 100/834, loss: 0.24447, lr: 0.070649, top1: 0.76391, throughput: 313.37 | 2022-04-03 12:43:55.779 [rank:7] [train], epoch: 43/50, iter: 100/834, loss: 0.24566, lr: 0.070649, top1: 0.75984, throughput: 313.16 | 2022-04-03 12:43:55.803 [rank:1] [train], epoch: 43/50, iter: 100/834, loss: 0.24644, lr: 0.070649, top1: 0.75969, throughput: 313.05 | 2022-04-03 12:43:55.804 [rank:2] [train], epoch: 43/50, iter: 100/834, loss: 0.24629, lr: 0.070649, top1: 0.75693, throughput: 313.00 | 2022-04-03 12:43:55.818 [rank:0] [train], epoch: 43/50, iter: 100/834, loss: 0.24620, lr: 0.070649, top1: 0.75672, throughput: 312.92 | 2022-04-03 12:43:55.822 [rank:3] [train], epoch: 43/50, iter: 100/834, loss: 0.24545, lr: 0.070649, top1: 0.75839, throughput: 312.96 | 2022-04-03 12:43:55.830 [rank:4] [train], epoch: 43/50, iter: 100/834, loss: 0.24689, lr: 0.070649, top1: 0.75740, throughput: 312.95 | 2022-04-03 12:43:55.834 [rank:5] [train], epoch: 43/50, iter: 100/834, loss: 0.24379, lr: 0.070649, top1: 0.76411, throughput: 313.04 | 2022-04-03 12:43:55.838 [rank:1] [train], epoch: 43/50, iter: 200/834, loss: 0.24475, lr: 0.068245, top1: 0.75937, throughput: 313.23 | 2022-04-03 12:44:57.101 [rank:2] [train], epoch: 43/50, iter: 200/834, loss: 0.24387, lr: 0.068245, top1: 0.76307, throughput: 313.23 | 2022-04-03 12:44:57.115 [rank:5] [train], epoch: 43/50, iter: 200/834, loss: 0.24520, lr: 0.068245, top1: 0.75979, throughput: 313.23 | 2022-04-03 12:44:57.135 [rank:3] [train], epoch: 43/50, iter: 200/834, loss: 0.24481, lr: 0.068245, top1: 0.75745, throughput: 313.14 | 2022-04-03 12:44:57.144 [rank:7] [train], epoch: 43/50, iter: 200/834, loss: 0.24395, lr: 0.068245, top1: 0.76161, throughput: 312.94 | 2022-04-03 12:44:57.157 [rank:6] [train], epoch: 43/50, iter: 200/834, loss: 0.24495, lr: 0.068245, top1: 0.76047, throughput: 312.74 | 2022-04-03 12:44:57.171 [rank:4] [train], epoch: 43/50, iter: 200/834, loss: 0.24520, lr: 0.068245, top1: 0.76125, throughput: 313.00 | 2022-04-03 12:44:57.175 [rank:0] [train], epoch: 43/50, iter: 200/834, loss: 0.24604, lr: 0.068245, top1: 0.75828, throughput: 312.69 | 2022-04-03 12:44:57.226 [rank:0] [train], epoch: 43/50, iter: 300/834, loss: 0.24624, lr: 0.065880, top1: 0.75703, throughput: 313.82 | 2022-04-03 12:45:58.407 [rank:2] [train], epoch: 43/50, iter: 300/834, loss: 0.24533, lr: 0.065880, top1: 0.75833, throughput: 312.85 | 2022-04-03 12:45:58.486 [rank:1] [train], epoch: 43/50, iter: 300/834, loss: 0.24609, lr: 0.065880, top1: 0.75943, throughput: 312.78 | 2022-04-03 12:45:58.486 [rank:7] [train], epoch: 43/50, iter: 300/834, loss: 0.24584, lr: 0.065880, top1: 0.75964, throughput: 313.06 | 2022-04-03 12:45:58.487 [rank:5] [train], epoch: 43/50, iter: 300/834, loss: 0.24644, lr: 0.065880, top1: 0.75927, throughput: 312.94 | 2022-04-03 12:45:58.489 [rank:3] [train], epoch: 43/50, iter: 300/834, loss: 0.24471, lr: 0.065880, top1: 0.76047, throughput: 312.91 | 2022-04-03 12:45:58.503 [rank:6] [train], epoch: 43/50, iter: 300/834, loss: 0.24677, lr: 0.065880, top1: 0.75578, throughput: 313.34 | 2022-04-03 12:45:58.446 [rank:4] [train], epoch: 43/50, iter: 300/834, loss: 0.24724, lr: 0.065880, top1: 0.75917, throughput: 313.30 | 2022-04-03 12:45:58.458 [rank:7] [train], epoch: 43/50, iter: 400/834, loss: 0.24569, lr: 0.063556, top1: 0.76339, throughput: 313.27 | 2022-04-03 12:46:59.777 [rank:2] [train], epoch: 43/50, iter: 400/834, loss: 0.24795, lr: 0.063556, top1: 0.75589, throughput: 313.25 | 2022-04-03 12:46:59.778 [rank:4] [train], epoch: 43/50, iter: 400/834, loss: 0.24490, lr: 0.063556, top1: 0.75802, throughput: 313.06 | 2022-04-03 12:46:59.788 [rank:0] [train], epoch: 43/50, iter: 400/834, loss: 0.24470, lr: 0.063556, top1: 0.76057, throughput: 312.80 | 2022-04-03 12:46:59.789 [rank:3] [train], epoch: 43/50, iter: 400/834, loss: 0.24412, lr: 0.063556, top1: 0.76052, throughput: 313.23 | 2022-04-03 12:46:59.799 [rank:1] [train], epoch: 43/50, iter: 400/834, loss: 0.24705, lr: 0.063556, top1: 0.75641, throughput: 313.09 | 2022-04-03 12:46:59.810 [rank:5] [train], epoch: 43/50, iter: 400/834, loss: 0.24546, lr: 0.063556, top1: 0.76047, throughput: 313.05 | 2022-04-03 12:46:59.820 [rank:6] [train], epoch: 43/50, iter: 400/834, loss: 0.24756, lr: 0.063556, top1: 0.75422, throughput: 313.25 | 2022-04-03 12:46:59.740 [rank:2] [train], epoch: 43/50, iter: 500/834, loss: 0.24499, lr: 0.061271, top1: 0.75630, throughput: 312.56 | 2022-04-03 12:48:01.207 [rank:1] [train], epoch: 43/50, iter: 500/834, loss: 0.24712, lr: 0.061271, top1: 0.75667, throughput: 312.71 | 2022-04-03 12:48:01.209 [rank:3] [train], epoch: 43/50, iter: 500/834, loss: 0.24423, lr: 0.061271, top1: 0.76104, throughput: 312.49 | 2022-04-03 12:48:01.240 [rank:5] [train], epoch: 43/50, iter: 500/834, loss: 0.24471, lr: 0.061271, top1: 0.76130, throughput: 312.58 | 2022-04-03 12:48:01.244 [rank:6] [train], epoch: 43/50, iter: 500/834, loss: 0.24571, lr: 0.061271, top1: 0.76073, throughput: 312.06 | 2022-04-03 12:48:01.266 [rank:0] [train], epoch: 43/50, iter: 500/834, loss: 0.24502, lr: 0.061271, top1: 0.76182, throughput: 312.27 | 2022-04-03 12:48:01.275 [rank:4] [train], epoch: 43/50, iter: 500/834, loss: 0.24486, lr: 0.061271, top1: 0.75703, throughput: 312.23 | 2022-04-03 12:48:01.282 [rank:7] [train], epoch: 43/50, iter: 500/834, loss: 0.24465, lr: 0.061271, top1: 0.76188, throughput: 311.90 | 2022-04-03 12:48:01.335 [rank:5] [train], epoch: 43/50, iter: 600/834, loss: 0.24700, lr: 0.059026, top1: 0.75615, throughput: 312.23 | 2022-04-03 12:49:02.737 [rank:2] [train], epoch: 43/50, iter: 600/834, loss: 0.24625, lr: 0.059026, top1: 0.75594, throughput: 311.99 | 2022-04-03 12:49:02.748 [rank:4] [train], epoch: 43/50, iter: 600/834, loss: 0.24592, lr: 0.059026, top1: 0.75911, throughput: 312.32 | 2022-04-03 12:49:02.758 [rank:7] [train], epoch: 43/50, iter: 600/834, loss: 0.24717, lr: 0.059026, top1: 0.75484, throughput: 312.57 | 2022-04-03 12:49:02.762 [rank:1] [train], epoch: 43/50, iter: 600/834, loss: 0.24800, lr: 0.059026, top1: 0.75219, throughput: 311.89 | 2022-04-03 12:49:02.769 [rank:6] [train], epoch: 43/50, iter: 600/834, loss: 0.24700, lr: 0.059026, top1: 0.75698, throughput: 312.04 | 2022-04-03 12:49:02.796 [rank:3] [train], epoch: 43/50, iter: 600/834, loss: 0.24537, lr: 0.059026, top1: 0.75833, throughput: 311.87 | 2022-04-03 12:49:02.803 [rank:0] [train], epoch: 43/50, iter: 600/834, loss: 0.24585, lr: 0.059026, top1: 0.76193, throughput: 311.98 | 2022-04-03 12:49:02.816 [rank:4] [train], epoch: 43/50, iter: 700/834, loss: 0.24569, lr: 0.056822, top1: 0.76099, throughput: 313.34 | 2022-04-03 12:50:04.034 [rank:1] [train], epoch: 43/50, iter: 700/834, loss: 0.24587, lr: 0.056822, top1: 0.75771, throughput: 313.25 | 2022-04-03 12:50:04.062 [rank:5] [train], epoch: 43/50, iter: 700/834, loss: 0.24521, lr: 0.056822, top1: 0.75969, throughput: 313.03 | 2022-04-03 12:50:04.073 [rank:7] [train], epoch: 43/50, iter: 700/834, loss: 0.24619, lr: 0.056822, top1: 0.75812, throughput: 313.09 | 2022-04-03 12:50:04.086 [rank:3] [train], epoch: 43/50, iter: 700/834, loss: 0.24694, lr: 0.056822, top1: 0.75818, throughput: 313.22 | 2022-04-03 12:50:04.102 [rank:6] [train], epoch: 43/50, iter: 700/834, loss: 0.24689, lr: 0.056822, top1: 0.75521, throughput: 313.13 | 2022-04-03 12:50:04.112 [rank:2] [train], epoch: 43/50, iter: 700/834, loss: 0.24342, lr: 0.056822, top1: 0.76172, throughput: 312.88 | 2022-04-03 12:50:04.113 [rank:0] [train], epoch: 43/50, iter: 700/834, loss: 0.24479, lr: 0.056822, top1: 0.75776, throughput: 313.09 | 2022-04-03 12:50:04.141 [rank:4] [train], epoch: 43/50, iter: 800/834, loss: 0.24669, lr: 0.054658, top1: 0.75411, throughput: 313.15 | 2022-04-03 12:51:05.347 [rank:3] [train], epoch: 43/50, iter: 800/834, loss: 0.24542, lr: 0.054658, top1: 0.75776, throughput: 313.49 | 2022-04-03 12:51:05.348 [rank:1] [train], epoch: 43/50, iter: 800/834, loss: 0.24521, lr: 0.054658, top1: 0.76193, throughput: 313.22 | 2022-04-03 12:51:05.361 [rank:6] [train], epoch: 43/50, iter: 800/834, loss: 0.24720, lr: 0.054658, top1: 0.75646, throughput: 313.41 | 2022-04-03 12:51:05.374 [rank:5] [train], epoch: 43/50, iter: 800/834, loss: 0.24750, lr: 0.054658, top1: 0.75214, throughput: 313.15 | 2022-04-03 12:51:05.386 [rank:2] [train], epoch: 43/50, iter: 800/834, loss: 0.24630, lr: 0.054658, top1: 0.75505, throughput: 313.25 | 2022-04-03 12:51:05.405 [rank:0] [train], epoch: 43/50, iter: 800/834, loss: 0.24546, lr: 0.054658, top1: 0.75818, throughput: 313.39 | 2022-04-03 12:51:05.406 [rank:7] [train], epoch: 43/50, iter: 800/834, loss: 0.24475, lr: 0.054658, top1: 0.76203, throughput: 313.11 | 2022-04-03 12:51:05.407 [rank:6] [train], epoch: 43/50, iter: 834/834, loss: 0.24785, lr: 0.053932, top1: 0.75260, throughput: 313.10 | 2022-04-03 12:51:26.224 [rank:5] [train], epoch: 43/50, iter: 834/834, loss: 0.24547, lr: 0.053932, top1: 0.75643, throughput: 313.25 | 2022-04-03 12:51:26.226 [rank:0] [train], epoch: 43/50, iter: 834/834, loss: 0.24279, lr: 0.053932, top1: 0.76930, throughput: 313.48 | 2022-04-03 12:51:26.231 [rank:3] [train], epoch: 43/50, iter: 834/834, loss: 0.24617, lr: 0.053932, top1: 0.75735, throughput: 312.58 | 2022-04-03 12:51:26.232 [rank:1] [train], epoch: 43/50, iter: 834/834, loss: 0.24364, lr: 0.053932, top1: 0.76011, throughput: 312.73 | 2022-04-03 12:51:26.235 [rank:2] [train], epoch: 43/50, iter: 834/834, loss: 0.24561, lr: 0.053932, top1: 0.75827, throughput: 313.38 | 2022-04-03 12:51:26.236 [rank:7] [train], epoch: 43/50, iter: 834/834, loss: 0.24662, lr: 0.053932, top1: 0.75521, throughput: 312.96 | 2022-04-03 12:51:26.266 [rank:4] [train], epoch: 43/50, iter: 834/834, loss: 0.24711, lr: 0.053932, top1: 0.75414, throughput: 311.92 | 2022-04-03 12:51:26.276 [rank:0] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.75312, throughput: 494.67 | 2022-04-03 12:51:38.865 [rank:1] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.75232, throughput: 494.71 | 2022-04-03 12:51:38.869 [rank:2] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.73904, throughput: 494.56 | 2022-04-03 12:51:38.874 [rank:3] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74928, throughput: 494.37 | 2022-04-03 12:51:38.874 [rank:4] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74480, throughput: 495.83 | 2022-04-03 12:51:38.881 [rank:7] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.75344, throughput: 495.33 | 2022-04-03 12:51:38.884 [rank:5] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74112, throughput: 493.03 | 2022-04-03 12:51:38.903 [rank:6] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.75200, throughput: 492.23 | 2022-04-03 12:51:38.921 [rank:7] [train], epoch: 44/50, iter: 100/834, loss: 0.24310, lr: 0.051822, top1: 0.76380, throughput: 312.46 | 2022-04-03 12:52:40.332 [rank:6] [train], epoch: 44/50, iter: 100/834, loss: 0.24345, lr: 0.051822, top1: 0.76286, throughput: 312.54 | 2022-04-03 12:52:40.352 [rank:5] [train], epoch: 44/50, iter: 100/834, loss: 0.24221, lr: 0.051822, top1: 0.76443, throughput: 312.38 | 2022-04-03 12:52:40.367 [rank:2] [train], epoch: 44/50, iter: 100/834, loss: 0.24134, lr: 0.051822, top1: 0.76812, throughput: 312.19 | 2022-04-03 12:52:40.374 [rank:1] [train], epoch: 44/50, iter: 100/834, loss: 0.23899, lr: 0.051822, top1: 0.77505, throughput: 312.15 | 2022-04-03 12:52:40.379 [rank:3] [train], epoch: 44/50, iter: 100/834, loss: 0.24235, lr: 0.051822, top1: 0.76432, throughput: 312.17 | 2022-04-03 12:52:40.380 [rank:0] [train], epoch: 44/50, iter: 100/834, loss: 0.24062, lr: 0.051822, top1: 0.77323, throughput: 312.02 | 2022-04-03 12:52:40.400 [rank:4] [train], epoch: 44/50, iter: 100/834, loss: 0.24374, lr: 0.051822, top1: 0.76542, throughput: 311.98 | 2022-04-03 12:52:40.424 [rank:1] [train], epoch: 44/50, iter: 200/834, loss: 0.24064, lr: 0.049753, top1: 0.77000, throughput: 312.87 | 2022-04-03 12:53:41.746 [rank:3] [train], epoch: 44/50, iter: 200/834, loss: 0.24071, lr: 0.049753, top1: 0.76828, throughput: 312.86 | 2022-04-03 12:53:41.750 [rank:0] [train], epoch: 44/50, iter: 200/834, loss: 0.24233, lr: 0.049753, top1: 0.76594, throughput: 312.94 | 2022-04-03 12:53:41.754 [rank:5] [train], epoch: 44/50, iter: 200/834, loss: 0.24093, lr: 0.049753, top1: 0.76812, throughput: 312.73 | 2022-04-03 12:53:41.762 [rank:7] [train], epoch: 44/50, iter: 200/834, loss: 0.24083, lr: 0.049753, top1: 0.77016, throughput: 312.36 | 2022-04-03 12:53:41.799 [rank:6] [train], epoch: 44/50, iter: 200/834, loss: 0.24311, lr: 0.049753, top1: 0.76510, throughput: 312.45 | 2022-04-03 12:53:41.803 [rank:4] [train], epoch: 44/50, iter: 200/834, loss: 0.24346, lr: 0.049753, top1: 0.76234, throughput: 312.79 | 2022-04-03 12:53:41.806 [rank:2] [train], epoch: 44/50, iter: 200/834, loss: 0.24227, lr: 0.049753, top1: 0.76818, throughput: 312.38 | 2022-04-03 12:53:41.837 [rank:5] [train], epoch: 44/50, iter: 300/834, loss: 0.24036, lr: 0.047725, top1: 0.76797, throughput: 312.35 | 2022-04-03 12:54:43.232 [rank:7] [train], epoch: 44/50, iter: 300/834, loss: 0.24182, lr: 0.047725, top1: 0.76510, throughput: 312.50 | 2022-04-03 12:54:43.240 [rank:1] [train], epoch: 44/50, iter: 300/834, loss: 0.24173, lr: 0.047725, top1: 0.76740, throughput: 312.22 | 2022-04-03 12:54:43.240 [rank:4] [train], epoch: 44/50, iter: 300/834, loss: 0.24232, lr: 0.047725, top1: 0.76917, throughput: 312.42 | 2022-04-03 12:54:43.261 [rank:6] [train], epoch: 44/50, iter: 300/834, loss: 0.24124, lr: 0.047725, top1: 0.76896, throughput: 312.39 | 2022-04-03 12:54:43.264 [rank:3] [train], epoch: 44/50, iter: 300/834, loss: 0.24124, lr: 0.047725, top1: 0.77000, throughput: 311.94 | 2022-04-03 12:54:43.300 [rank:0] [train], epoch: 44/50, iter: 300/834, loss: 0.24105, lr: 0.047725, top1: 0.76656, throughput: 311.92 | 2022-04-03 12:54:43.309 [rank:2] [train], epoch: 44/50, iter: 300/834, loss: 0.24390, lr: 0.047725, top1: 0.76490, throughput: 312.23 | 2022-04-03 12:54:43.331 [rank:1] [train], epoch: 44/50, iter: 400/834, loss: 0.24341, lr: 0.045737, top1: 0.76516, throughput: 312.64 | 2022-04-03 12:55:44.653 [rank:2] [train], epoch: 44/50, iter: 400/834, loss: 0.24160, lr: 0.045737, top1: 0.76682, throughput: 313.07 | 2022-04-03 12:55:44.658 [rank:6] [train], epoch: 44/50, iter: 400/834, loss: 0.24177, lr: 0.045737, top1: 0.76542, throughput: 312.65 | 2022-04-03 12:55:44.674 [rank:5] [train], epoch: 44/50, iter: 400/834, loss: 0.24267, lr: 0.045737, top1: 0.76375, throughput: 312.49 | 2022-04-03 12:55:44.674 [rank:4] [train], epoch: 44/50, iter: 400/834, loss: 0.24061, lr: 0.045737, top1: 0.77125, throughput: 312.60 | 2022-04-03 12:55:44.681 [rank:3] [train], epoch: 44/50, iter: 400/834, loss: 0.24222, lr: 0.045737, top1: 0.76583, throughput: 312.77 | 2022-04-03 12:55:44.686 [rank:7] [train], epoch: 44/50, iter: 400/834, loss: 0.24248, lr: 0.045737, top1: 0.76661, throughput: 312.44 | 2022-04-03 12:55:44.691 [rank:0] [train], epoch: 44/50, iter: 400/834, loss: 0.24408, lr: 0.045737, top1: 0.76391, throughput: 312.74 | 2022-04-03 12:55:44.703 [rank:3] [train], epoch: 44/50, iter: 500/834, loss: 0.24193, lr: 0.043791, top1: 0.76583, throughput: 312.93 | 2022-04-03 12:56:46.042 [rank:4] [train], epoch: 44/50, iter: 500/834, loss: 0.24589, lr: 0.043791, top1: 0.75792, throughput: 312.71 | 2022-04-03 12:56:46.079 [rank:6] [train], epoch: 44/50, iter: 500/834, loss: 0.24250, lr: 0.043791, top1: 0.76672, throughput: 312.64 | 2022-04-03 12:56:46.087 [rank:0] [train], epoch: 44/50, iter: 500/834, loss: 0.24238, lr: 0.043791, top1: 0.76391, throughput: 312.78 | 2022-04-03 12:56:46.088 [rank:2] [train], epoch: 44/50, iter: 500/834, loss: 0.24273, lr: 0.043791, top1: 0.76661, throughput: 312.51 | 2022-04-03 12:56:46.096 [rank:5] [train], epoch: 44/50, iter: 500/834, loss: 0.24284, lr: 0.043791, top1: 0.76474, throughput: 312.59 | 2022-04-03 12:56:46.097 [rank:1] [train], epoch: 44/50, iter: 500/834, loss: 0.24142, lr: 0.043791, top1: 0.76609, throughput: 312.47 | 2022-04-03 12:56:46.100 [rank:7] [train], epoch: 44/50, iter: 500/834, loss: 0.24332, lr: 0.043791, top1: 0.76516, throughput: 312.99 | 2022-04-03 12:56:46.034 [rank:6] [train], epoch: 44/50, iter: 600/834, loss: 0.24189, lr: 0.041886, top1: 0.76813, throughput: 313.60 | 2022-04-03 12:57:47.311 [rank:1] [train], epoch: 44/50, iter: 600/834, loss: 0.24121, lr: 0.041886, top1: 0.76354, throughput: 313.58 | 2022-04-03 12:57:47.329 [rank:3] [train], epoch: 44/50, iter: 600/834, loss: 0.24258, lr: 0.041886, top1: 0.76255, throughput: 313.21 | 2022-04-03 12:57:47.342 [rank:2] [train], epoch: 44/50, iter: 600/834, loss: 0.24077, lr: 0.041886, top1: 0.77026, throughput: 313.43 | 2022-04-03 12:57:47.354 [rank:4] [train], epoch: 44/50, iter: 600/834, loss: 0.24217, lr: 0.041886, top1: 0.76333, throughput: 313.18 | 2022-04-03 12:57:47.385 [rank:5] [train], epoch: 44/50, iter: 600/834, loss: 0.24244, lr: 0.041886, top1: 0.76672, throughput: 313.23 | 2022-04-03 12:57:47.395 [rank:0] [train], epoch: 44/50, iter: 600/834, loss: 0.24234, lr: 0.041886, top1: 0.76714, throughput: 313.02 | 2022-04-03 12:57:47.426 [rank:7] [train], epoch: 44/50, iter: 600/834, loss: 0.24335, lr: 0.041886, top1: 0.76745, throughput: 312.74 | 2022-04-03 12:57:47.427 [rank:1] [train], epoch: 44/50, iter: 700/834, loss: 0.24240, lr: 0.040022, top1: 0.76734, throughput: 313.25 | 2022-04-03 12:58:48.622 [rank:3] [train], epoch: 44/50, iter: 700/834, loss: 0.24263, lr: 0.040022, top1: 0.76578, throughput: 313.28 | 2022-04-03 12:58:48.629 [rank:4] [train], epoch: 44/50, iter: 700/834, loss: 0.24145, lr: 0.040022, top1: 0.76599, throughput: 313.47 | 2022-04-03 12:58:48.635 [rank:5] [train], epoch: 44/50, iter: 700/834, loss: 0.24132, lr: 0.040022, top1: 0.76906, throughput: 313.48 | 2022-04-03 12:58:48.642 [rank:0] [train], epoch: 44/50, iter: 700/834, loss: 0.24125, lr: 0.040022, top1: 0.76839, throughput: 313.61 | 2022-04-03 12:58:48.648 [rank:6] [train], epoch: 44/50, iter: 700/834, loss: 0.24239, lr: 0.040022, top1: 0.76594, throughput: 312.99 | 2022-04-03 12:58:48.655 [rank:2] [train], epoch: 44/50, iter: 700/834, loss: 0.24207, lr: 0.040022, top1: 0.76854, throughput: 313.19 | 2022-04-03 12:58:48.660 [rank:7] [train], epoch: 44/50, iter: 700/834, loss: 0.24117, lr: 0.040022, top1: 0.76719, throughput: 313.51 | 2022-04-03 12:58:48.670 [rank:5] [train], epoch: 44/50, iter: 800/834, loss: 0.24247, lr: 0.038199, top1: 0.76672, throughput: 312.99 | 2022-04-03 12:59:49.986 [rank:2] [train], epoch: 44/50, iter: 800/834, loss: 0.23997, lr: 0.038199, top1: 0.77062, throughput: 312.94 | 2022-04-03 12:59:50.012 [rank:4] [train], epoch: 44/50, iter: 800/834, loss: 0.24054, lr: 0.038199, top1: 0.77167, throughput: 312.79 | 2022-04-03 12:59:50.019 [rank:0] [train], epoch: 44/50, iter: 800/834, loss: 0.24148, lr: 0.038199, top1: 0.77016, throughput: 312.79 | 2022-04-03 12:59:50.031 [rank:3] [train], epoch: 44/50, iter: 800/834, loss: 0.24257, lr: 0.038199, top1: 0.76292, throughput: 312.69 | 2022-04-03 12:59:50.032 [rank:1] [train], epoch: 44/50, iter: 800/834, loss: 0.24222, lr: 0.038199, top1: 0.76453, throughput: 312.57 | 2022-04-03 12:59:50.049 [rank:6] [train], epoch: 44/50, iter: 800/834, loss: 0.24098, lr: 0.038199, top1: 0.76865, throughput: 312.72 | 2022-04-03 12:59:50.052 [rank:7] [train], epoch: 44/50, iter: 800/834, loss: 0.24137, lr: 0.038199, top1: 0.76646, throughput: 312.71 | 2022-04-03 12:59:50.070 [rank:1] [train], epoch: 44/50, iter: 834/834, loss: 0.24155, lr: 0.037589, top1: 0.77175, throughput: 310.81 | 2022-04-03 13:00:11.052 [rank:2] [train], epoch: 44/50, iter: 834/834, loss: 0.24009, lr: 0.037589, top1: 0.76762, throughput: 310.08 | 2022-04-03 13:00:11.065 [rank:3] [train], epoch: 44/50, iter: 834/834, loss: 0.24250, lr: 0.037589, top1: 0.76731, throughput: 310.33 | 2022-04-03 13:00:11.067 [rank:4] [train], epoch: 44/50, iter: 834/834, loss: 0.24589, lr: 0.037589, top1: 0.75521, throughput: 310.07 | 2022-04-03 13:00:11.072 [rank:6] [train], epoch: 44/50, iter: 834/834, loss: 0.24615, lr: 0.037589, top1: 0.75337, throughput: 310.57 | 2022-04-03 13:00:11.072 [rank:0] [train], epoch: 44/50, iter: 834/834, loss: 0.23845, lr: 0.037589, top1: 0.77420, throughput: 310.03 | 2022-04-03 13:00:11.087 [rank:5] [train], epoch: 44/50, iter: 834/834, loss: 0.24347, lr: 0.037589, top1: 0.76149, throughput: 309.24 | 2022-04-03 13:00:11.096 [rank:7] [train], epoch: 44/50, iter: 834/834, loss: 0.24023, lr: 0.037589, top1: 0.77313, throughput: 310.36 | 2022-04-03 13:00:11.104 [rank:0] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75136, throughput: 491.46 | 2022-04-03 13:00:23.804 [rank:2] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.74256, throughput: 490.44 | 2022-04-03 13:00:23.809 [rank:4] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.74880, throughput: 490.24 | 2022-04-03 13:00:23.821 [rank:7] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75728, throughput: 491.21 | 2022-04-03 13:00:23.827 [rank:3] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75552, throughput: 489.75 | 2022-04-03 13:00:23.829 [rank:1] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75584, throughput: 488.38 | 2022-04-03 13:00:23.849 [rank:6] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75776, throughput: 488.89 | 2022-04-03 13:00:23.855 [rank:5] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.74112, throughput: 489.73 | 2022-04-03 13:00:23.858 [rank:2] [train], epoch: 45/50, iter: 100/834, loss: 0.23890, lr: 0.035821, top1: 0.77422, throughput: 313.18 | 2022-04-03 13:01:25.116 [rank:7] [train], epoch: 45/50, iter: 100/834, loss: 0.23823, lr: 0.035821, top1: 0.77479, throughput: 313.20 | 2022-04-03 13:01:25.129 [rank:5] [train], epoch: 45/50, iter: 100/834, loss: 0.23864, lr: 0.035821, top1: 0.77375, throughput: 313.36 | 2022-04-03 13:01:25.130 [rank:0] [train], epoch: 45/50, iter: 100/834, loss: 0.23587, lr: 0.035821, top1: 0.78057, throughput: 313.04 | 2022-04-03 13:01:25.138 [rank:6] [train], epoch: 45/50, iter: 100/834, loss: 0.23947, lr: 0.035821, top1: 0.77104, throughput: 313.26 | 2022-04-03 13:01:25.147 [rank:1] [train], epoch: 45/50, iter: 100/834, loss: 0.23897, lr: 0.035821, top1: 0.77432, throughput: 313.16 | 2022-04-03 13:01:25.160 [rank:3] [train], epoch: 45/50, iter: 100/834, loss: 0.24071, lr: 0.035821, top1: 0.77063, throughput: 312.89 | 2022-04-03 13:01:25.192 [rank:4] [train], epoch: 45/50, iter: 100/834, loss: 0.23890, lr: 0.035821, top1: 0.77198, throughput: 312.81 | 2022-04-03 13:01:25.201 [rank:0] [train], epoch: 45/50, iter: 200/834, loss: 0.24082, lr: 0.034096, top1: 0.77328, throughput: 311.49 | 2022-04-03 13:02:26.776 [rank:5] [train], epoch: 45/50, iter: 200/834, loss: 0.23883, lr: 0.034096, top1: 0.77302, throughput: 311.26 | 2022-04-03 13:02:26.816 [rank:3] [train], epoch: 45/50, iter: 200/834, loss: 0.24003, lr: 0.034096, top1: 0.77125, throughput: 311.50 | 2022-04-03 13:02:26.830 [rank:4] [train], epoch: 45/50, iter: 200/834, loss: 0.23979, lr: 0.034096, top1: 0.76807, throughput: 311.35 | 2022-04-03 13:02:26.868 [rank:2] [train], epoch: 45/50, iter: 200/834, loss: 0.23946, lr: 0.034096, top1: 0.77089, throughput: 310.88 | 2022-04-03 13:02:26.875 [rank:7] [train], epoch: 45/50, iter: 200/834, loss: 0.23863, lr: 0.034096, top1: 0.77307, throughput: 310.94 | 2022-04-03 13:02:26.878 [rank:6] [train], epoch: 45/50, iter: 200/834, loss: 0.23582, lr: 0.034096, top1: 0.78104, throughput: 311.00 | 2022-04-03 13:02:26.884 [rank:1] [train], epoch: 45/50, iter: 200/834, loss: 0.23853, lr: 0.034096, top1: 0.77198, throughput: 311.01 | 2022-04-03 13:02:26.895 [rank:7] [train], epoch: 45/50, iter: 300/834, loss: 0.23961, lr: 0.032412, top1: 0.77005, throughput: 313.14 | 2022-04-03 13:03:28.191 [rank:6] [train], epoch: 45/50, iter: 300/834, loss: 0.23822, lr: 0.032412, top1: 0.77411, throughput: 313.16 | 2022-04-03 13:03:28.194 [rank:0] [train], epoch: 45/50, iter: 300/834, loss: 0.23728, lr: 0.032412, top1: 0.77745, throughput: 312.43 | 2022-04-03 13:03:28.229 [rank:2] [train], epoch: 45/50, iter: 300/834, loss: 0.23915, lr: 0.032412, top1: 0.77068, throughput: 312.93 | 2022-04-03 13:03:28.230 [rank:3] [train], epoch: 45/50, iter: 300/834, loss: 0.23885, lr: 0.032412, top1: 0.77339, throughput: 312.67 | 2022-04-03 13:03:28.237 [rank:1] [train], epoch: 45/50, iter: 300/834, loss: 0.23922, lr: 0.032412, top1: 0.77208, throughput: 312.99 | 2022-04-03 13:03:28.239 [rank:5] [train], epoch: 45/50, iter: 300/834, loss: 0.23930, lr: 0.032412, top1: 0.77068, throughput: 312.57 | 2022-04-03 13:03:28.242 [rank:4] [train], epoch: 45/50, iter: 300/834, loss: 0.23783, lr: 0.032412, top1: 0.77724, throughput: 312.82 | 2022-04-03 13:03:28.245 [rank:2] [train], epoch: 45/50, iter: 400/834, loss: 0.23756, lr: 0.030769, top1: 0.77776, throughput: 314.04 | 2022-04-03 13:04:29.370 [rank:4] [train], epoch: 45/50, iter: 400/834, loss: 0.23809, lr: 0.030769, top1: 0.77422, throughput: 314.11 | 2022-04-03 13:04:29.370 [rank:5] [train], epoch: 45/50, iter: 400/834, loss: 0.24097, lr: 0.030769, top1: 0.77068, throughput: 313.93 | 2022-04-03 13:04:29.402 [rank:1] [train], epoch: 45/50, iter: 400/834, loss: 0.23989, lr: 0.030769, top1: 0.77156, throughput: 313.88 | 2022-04-03 13:04:29.409 [rank:6] [train], epoch: 45/50, iter: 400/834, loss: 0.24203, lr: 0.030769, top1: 0.76432, throughput: 313.64 | 2022-04-03 13:04:29.411 [rank:3] [train], epoch: 45/50, iter: 400/834, loss: 0.23803, lr: 0.030769, top1: 0.77401, throughput: 313.81 | 2022-04-03 13:04:29.419 [rank:0] [train], epoch: 45/50, iter: 400/834, loss: 0.23984, lr: 0.030769, top1: 0.77417, throughput: 313.76 | 2022-04-03 13:04:29.422 [rank:7] [train], epoch: 45/50, iter: 400/834, loss: 0.23881, lr: 0.030769, top1: 0.77260, throughput: 313.92 | 2022-04-03 13:04:29.354 [rank:1] [train], epoch: 45/50, iter: 500/834, loss: 0.23851, lr: 0.029169, top1: 0.77464, throughput: 311.34 | 2022-04-03 13:05:31.079 [rank:7] [train], epoch: 45/50, iter: 500/834, loss: 0.24100, lr: 0.029169, top1: 0.76786, throughput: 311.03 | 2022-04-03 13:05:31.086 [rank:6] [train], epoch: 45/50, iter: 500/834, loss: 0.23887, lr: 0.029169, top1: 0.77078, throughput: 311.31 | 2022-04-03 13:05:31.086 [rank:5] [train], epoch: 45/50, iter: 500/834, loss: 0.23814, lr: 0.029169, top1: 0.77641, throughput: 311.25 | 2022-04-03 13:05:31.089 [rank:0] [train], epoch: 45/50, iter: 500/834, loss: 0.23860, lr: 0.029169, top1: 0.77474, throughput: 311.29 | 2022-04-03 13:05:31.101 [rank:3] [train], epoch: 45/50, iter: 500/834, loss: 0.24063, lr: 0.029169, top1: 0.76969, throughput: 311.16 | 2022-04-03 13:05:31.123 [rank:2] [train], epoch: 45/50, iter: 500/834, loss: 0.23807, lr: 0.029169, top1: 0.77859, throughput: 310.91 | 2022-04-03 13:05:31.125 [rank:4] [train], epoch: 45/50, iter: 500/834, loss: 0.24034, lr: 0.029169, top1: 0.77115, throughput: 310.85 | 2022-04-03 13:05:31.136 [rank:7] [train], epoch: 45/50, iter: 600/834, loss: 0.23894, lr: 0.027611, top1: 0.77505, throughput: 313.53 | 2022-04-03 13:06:32.323 [rank:2] [train], epoch: 45/50, iter: 600/834, loss: 0.23803, lr: 0.027611, top1: 0.77609, throughput: 313.55 | 2022-04-03 13:06:32.358 [rank:4] [train], epoch: 45/50, iter: 600/834, loss: 0.23892, lr: 0.027611, top1: 0.77276, throughput: 313.52 | 2022-04-03 13:06:32.376 [rank:5] [train], epoch: 45/50, iter: 600/834, loss: 0.23634, lr: 0.027611, top1: 0.78115, throughput: 313.23 | 2022-04-03 13:06:32.387 [rank:0] [train], epoch: 45/50, iter: 600/834, loss: 0.23803, lr: 0.027611, top1: 0.77661, throughput: 313.28 | 2022-04-03 13:06:32.388 [rank:6] [train], epoch: 45/50, iter: 600/834, loss: 0.23890, lr: 0.027611, top1: 0.77286, throughput: 313.20 | 2022-04-03 13:06:32.389 [rank:1] [train], epoch: 45/50, iter: 600/834, loss: 0.23934, lr: 0.027611, top1: 0.77005, throughput: 313.11 | 2022-04-03 13:06:32.399 [rank:3] [train], epoch: 45/50, iter: 600/834, loss: 0.23666, lr: 0.027611, top1: 0.77870, throughput: 313.22 | 2022-04-03 13:06:32.422 [rank:4] [train], epoch: 45/50, iter: 700/834, loss: 0.23827, lr: 0.026094, top1: 0.77516, throughput: 312.39 | 2022-04-03 13:07:33.838 [rank:1] [train], epoch: 45/50, iter: 700/834, loss: 0.23803, lr: 0.026094, top1: 0.77161, throughput: 312.41 | 2022-04-03 13:07:33.857 [rank:3] [train], epoch: 45/50, iter: 700/834, loss: 0.23861, lr: 0.026094, top1: 0.77312, throughput: 312.52 | 2022-04-03 13:07:33.858 [rank:6] [train], epoch: 45/50, iter: 700/834, loss: 0.23846, lr: 0.026094, top1: 0.77448, throughput: 312.29 | 2022-04-03 13:07:33.869 [rank:2] [train], epoch: 45/50, iter: 700/834, loss: 0.23807, lr: 0.026094, top1: 0.77557, throughput: 312.04 | 2022-04-03 13:07:33.890 [rank:0] [train], epoch: 45/50, iter: 700/834, loss: 0.23913, lr: 0.026094, top1: 0.77031, throughput: 312.10 | 2022-04-03 13:07:33.907 [rank:7] [train], epoch: 45/50, iter: 700/834, loss: 0.23957, lr: 0.026094, top1: 0.77531, throughput: 311.77 | 2022-04-03 13:07:33.907 [rank:5] [train], epoch: 45/50, iter: 700/834, loss: 0.23800, lr: 0.026094, top1: 0.77484, throughput: 312.07 | 2022-04-03 13:07:33.911 [rank:3] [train], epoch: 45/50, iter: 800/834, loss: 0.23958, lr: 0.024620, top1: 0.77234, throughput: 313.67 | 2022-04-03 13:08:35.069 [rank:1] [train], epoch: 45/50, iter: 800/834, loss: 0.24026, lr: 0.024620, top1: 0.76964, throughput: 313.57 | 2022-04-03 13:08:35.087 [rank:6] [train], epoch: 45/50, iter: 800/834, loss: 0.23938, lr: 0.024620, top1: 0.77438, throughput: 313.63 | 2022-04-03 13:08:35.088 [rank:4] [train], epoch: 45/50, iter: 800/834, loss: 0.23855, lr: 0.024620, top1: 0.77328, throughput: 313.41 | 2022-04-03 13:08:35.099 [rank:0] [train], epoch: 45/50, iter: 800/834, loss: 0.23911, lr: 0.024620, top1: 0.77469, throughput: 313.76 | 2022-04-03 13:08:35.100 [rank:5] [train], epoch: 45/50, iter: 800/834, loss: 0.23824, lr: 0.024620, top1: 0.77760, throughput: 313.77 | 2022-04-03 13:08:35.103 [rank:7] [train], epoch: 45/50, iter: 800/834, loss: 0.23913, lr: 0.024620, top1: 0.77021, throughput: 314.07 | 2022-04-03 13:08:35.041 [rank:2] [train], epoch: 45/50, iter: 800/834, loss: 0.23807, lr: 0.024620, top1: 0.77359, throughput: 313.47 | 2022-04-03 13:08:35.139 [rank:1] [train], epoch: 45/50, iter: 834/834, loss: 0.23835, lr: 0.024128, top1: 0.77374, throughput: 310.60 | 2022-04-03 13:08:56.104 [rank:5] [train], epoch: 45/50, iter: 834/834, loss: 0.23771, lr: 0.024128, top1: 0.77972, throughput: 310.84 | 2022-04-03 13:08:56.104 [rank:4] [train], epoch: 45/50, iter: 834/834, loss: 0.23979, lr: 0.024128, top1: 0.77589, throughput: 310.76 | 2022-04-03 13:08:56.106 [rank:6] [train], epoch: 45/50, iter: 834/834, loss: 0.23962, lr: 0.024128, top1: 0.77206, throughput: 310.45 | 2022-04-03 13:08:56.116 [rank:3] [train], epoch: 45/50, iter: 834/834, loss: 0.24024, lr: 0.024128, top1: 0.76547, throughput: 309.71 | 2022-04-03 13:08:56.147 [rank:2] [train], epoch: 45/50, iter: 834/834, loss: 0.24195, lr: 0.024128, top1: 0.76731, throughput: 310.73 | 2022-04-03 13:08:56.147 [rank:0] [train], epoch: 45/50, iter: 834/834, loss: 0.24327, lr: 0.024128, top1: 0.76961, throughput: 310.05 | 2022-04-03 13:08:56.155 [rank:7] [train], epoch: 45/50, iter: 834/834, loss: 0.23739, lr: 0.024128, top1: 0.78018, throughput: 309.14 | 2022-04-03 13:08:56.158 [rank:2] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.74864, throughput: 496.17 | 2022-04-03 13:09:08.744 [rank:0] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76176, throughput: 496.47 | 2022-04-03 13:09:08.744 [rank:3] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76176, throughput: 495.68 | 2022-04-03 13:09:08.756 [rank:1] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76032, throughput: 493.91[rank:4] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.75824, throughput: 493.97 | 2022-04-03 13:09:08.758| 2022-04-03 13:09:08.758 [rank:7] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76368, throughput: 495.64 | 2022-04-03 13:09:08.768 [rank:5] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.74816, throughput: 493.34 | 2022-04-03 13:09:08.773 [rank:6] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76128, throughput: 492.54 | 2022-04-03 13:09:08.805 [rank:1] [train], epoch: 46/50, iter: 100/834, loss: 0.23715, lr: 0.022710, top1: 0.77958, throughput: 313.88 | 2022-04-03 13:10:09.927 [rank:3] [train], epoch: 46/50, iter: 100/834, loss: 0.23743, lr: 0.022710, top1: 0.77589, throughput: 313.80 | 2022-04-03 13:10:09.942 [rank:6] [train], epoch: 46/50, iter: 100/834, loss: 0.23786, lr: 0.022710, top1: 0.77578, throughput: 313.96 | 2022-04-03 13:10:09.959 [rank:0] [train], epoch: 46/50, iter: 100/834, loss: 0.23462, lr: 0.022710, top1: 0.78203, throughput: 313.64 | 2022-04-03 13:10:09.961 [rank:7] [train], epoch: 46/50, iter: 100/834, loss: 0.23482, lr: 0.022710, top1: 0.78328, throughput: 313.75 | 2022-04-03 13:10:09.962 [rank:4] [train], epoch: 46/50, iter: 100/834, loss: 0.23564, lr: 0.022710, top1: 0.78391, throughput: 313.69 | 2022-04-03 13:10:09.965 [rank:5] [train], epoch: 46/50, iter: 100/834, loss: 0.23651, lr: 0.022710, top1: 0.77937, throughput: 313.67 | 2022-04-03 13:10:09.984 [rank:2] [train], epoch: 46/50, iter: 100/834, loss: 0.23761, lr: 0.022710, top1: 0.77339, throughput: 313.48 | 2022-04-03 13:10:09.991 [rank:1] [train], epoch: 46/50, iter: 200/834, loss: 0.23379, lr: 0.021335, top1: 0.78604, throughput: 312.10 | 2022-04-03 13:11:11.446 [rank:7] [train], epoch: 46/50, iter: 200/834, loss: 0.23626, lr: 0.021335, top1: 0.78005, throughput: 312.23 | 2022-04-03 13:11:11.455 [rank:2] [train], epoch: 46/50, iter: 200/834, loss: 0.23542, lr: 0.021335, top1: 0.78078, throughput: 312.28 | 2022-04-03 13:11:11.475 [rank:6] [train], epoch: 46/50, iter: 200/834, loss: 0.23493, lr: 0.021335, top1: 0.78036, throughput: 312.11 | 2022-04-03 13:11:11.476 [rank:3] [train], epoch: 46/50, iter: 200/834, loss: 0.23632, lr: 0.021335, top1: 0.78052, throughput: 311.99 | 2022-04-03 13:11:11.482 [rank:4] [train], epoch: 46/50, iter: 200/834, loss: 0.23566, lr: 0.021335, top1: 0.77964, throughput: 312.10 | 2022-04-03 13:11:11.483 [rank:5] [train], epoch: 46/50, iter: 200/834, loss: 0.23569, lr: 0.021335, top1: 0.77969, throughput: 312.15 | 2022-04-03 13:11:11.492 [rank:0] [train], epoch: 46/50, iter: 200/834, loss: 0.23623, lr: 0.021335, top1: 0.77839, throughput: 311.97 | 2022-04-03 13:11:11.506 [rank:2] [train], epoch: 46/50, iter: 300/834, loss: 0.23530, lr: 0.020002, top1: 0.77865, throughput: 314.34 | 2022-04-03 13:12:12.556 [rank:4] [train], epoch: 46/50, iter: 300/834, loss: 0.23513, lr: 0.020002, top1: 0.77995, throughput: 314.29 | 2022-04-03 13:12:12.573 [rank:1] [train], epoch: 46/50, iter: 300/834, loss: 0.23685, lr: 0.020002, top1: 0.77792, throughput: 314.10 | 2022-04-03 13:12:12.574 [rank:6] [train], epoch: 46/50, iter: 300/834, loss: 0.23823, lr: 0.020002, top1: 0.77359, throughput: 314.21 | 2022-04-03 13:12:12.582 [rank:3] [train], epoch: 46/50, iter: 300/834, loss: 0.23465, lr: 0.020002, top1: 0.78167, throughput: 314.15 | 2022-04-03 13:12:12.599 [rank:7] [train], epoch: 46/50, iter: 300/834, loss: 0.23471, lr: 0.020002, top1: 0.78245, throughput: 313.84 | 2022-04-03 13:12:12.632 [rank:0] [train], epoch: 46/50, iter: 300/834, loss: 0.23565, lr: 0.020002, top1: 0.77922, throughput: 314.11 | 2022-04-03 13:12:12.632 [rank:5] [train], epoch: 46/50, iter: 300/834, loss: 0.23784, lr: 0.020002, top1: 0.77443, throughput: 314.00 | 2022-04-03 13:12:12.638 [rank:7] [train], epoch: 46/50, iter: 400/834, loss: 0.23697, lr: 0.018711, top1: 0.77870, throughput: 313.17 | 2022-04-03 13:13:13.941 [rank:1] [train], epoch: 46/50, iter: 400/834, loss: 0.23667, lr: 0.018711, top1: 0.78010, throughput: 312.78 | 2022-04-03 13:13:13.959 [rank:6] [train], epoch: 46/50, iter: 400/834, loss: 0.23603, lr: 0.018711, top1: 0.77724, throughput: 312.82 | 2022-04-03 13:13:13.959 [rank:4] [train], epoch: 46/50, iter: 400/834, loss: 0.23532, lr: 0.018711, top1: 0.77896, throughput: 312.73 | 2022-04-03 13:13:13.969 [rank:3] [train], epoch: 46/50, iter: 400/834, loss: 0.23417, lr: 0.018711, top1: 0.78224, throughput: 312.84 | 2022-04-03 13:13:13.973 [rank:2] [train], epoch: 46/50, iter: 400/834, loss: 0.23517, lr: 0.018711, top1: 0.78156, throughput: 312.57 | 2022-04-03 13:13:13.982 [rank:5] [train], epoch: 46/50, iter: 400/834, loss: 0.23656, lr: 0.018711, top1: 0.77573, throughput: 313.38 | 2022-04-03 13:13:13.906 [rank:0] [train], epoch: 46/50, iter: 400/834, loss: 0.23670, lr: 0.018711, top1: 0.78177, throughput: 312.83 | 2022-04-03 13:13:14.007 [rank:2] [train], epoch: 46/50, iter: 500/834, loss: 0.23440, lr: 0.017463, top1: 0.78047, throughput: 313.57 | 2022-04-03 13:14:15.212 [rank:0] [train], epoch: 46/50, iter: 500/834, loss: 0.23524, lr: 0.017463, top1: 0.77812, throughput: 313.60 | 2022-04-03 13:14:15.232 [rank:1] [train], epoch: 46/50, iter: 500/834, loss: 0.23819, lr: 0.017463, top1: 0.77516, throughput: 313.30 | 2022-04-03 13:14:15.244 [rank:7] [train], epoch: 46/50, iter: 500/834, loss: 0.23623, lr: 0.017463, top1: 0.77688, throughput: 313.19 | 2022-04-03 13:14:15.246 [rank:4] [train], epoch: 46/50, iter: 500/834, loss: 0.23516, lr: 0.017463, top1: 0.78266, throughput: 313.30[rank:6] [train], epoch: 46/50, iter: 500/834, loss: 0.23611, lr: 0.017463, top1: 0.77641, throughput: 313.25 | 2022-04-03 13:14:15.252 | 2022-04-03 13:14:15.252 [rank:5] [train], epoch: 46/50, iter: 500/834, loss: 0.23480, lr: 0.017463, top1: 0.78000, throughput: 312.96 | 2022-04-03 13:14:15.255 [rank:3] [train], epoch: 46/50, iter: 500/834, loss: 0.23573, lr: 0.017463, top1: 0.78005, throughput: 313.20 | 2022-04-03 13:14:15.277 [rank:3] [train], epoch: 46/50, iter: 600/834, loss: 0.23475, lr: 0.016257, top1: 0.78219, throughput: 311.93 | 2022-04-03 13:15:16.828 [rank:1] [train], epoch: 46/50, iter: 600/834, loss: 0.23564, lr: 0.016257, top1: 0.77781, throughput: 311.63 | 2022-04-03 13:15:16.854 [rank:5] [train], epoch: 46/50, iter: 600/834, loss: 0.23782, lr: 0.016257, top1: 0.77500, throughput: 311.63 | 2022-04-03 13:15:16.865 [rank:7] [train], epoch: 46/50, iter: 600/834, loss: 0.23626, lr: 0.016257, top1: 0.77786, throughput: 311.58 | 2022-04-03 13:15:16.866 [rank:2] [train], epoch: 46/50, iter: 600/834, loss: 0.23683, lr: 0.016257, top1: 0.77922, throughput: 311.37 | 2022-04-03 13:15:16.874 [rank:0] [train], epoch: 46/50, iter: 600/834, loss: 0.23722, lr: 0.016257, top1: 0.77573, throughput: 311.44 | 2022-04-03 13:15:16.881 [rank:4] [train], epoch: 46/50, iter: 600/834, loss: 0.23594, lr: 0.016257, top1: 0.78276, throughput: 311.47 | 2022-04-03 13:15:16.895 [rank:6] [train], epoch: 46/50, iter: 600/834, loss: 0.23559, lr: 0.016257, top1: 0.78062, throughput: 311.86 | 2022-04-03 13:15:16.818 [rank:5] [train], epoch: 46/50, iter: 700/834, loss: 0.23709, lr: 0.015095, top1: 0.77708, throughput: 312.38 | 2022-04-03 13:16:18.330 [rank:7] [train], epoch: 46/50, iter: 700/834, loss: 0.23730, lr: 0.015095, top1: 0.77823, throughput: 312.38 | 2022-04-03 13:16:18.330 [rank:0] [train], epoch: 46/50, iter: 700/834, loss: 0.23623, lr: 0.015095, top1: 0.78245, throughput: 312.37 | 2022-04-03 13:16:18.346 [rank:2] [train], epoch: 46/50, iter: 700/834, loss: 0.23611, lr: 0.015095, top1: 0.77854, throughput: 312.34 | 2022-04-03 13:16:18.346 [rank:4] [train], epoch: 46/50, iter: 700/834, loss: 0.23575, lr: 0.015095, top1: 0.78005, throughput: 312.37 | 2022-04-03 13:16:18.361 [rank:1] [train], epoch: 46/50, iter: 700/834, loss: 0.23692, lr: 0.015095, top1: 0.77422, throughput: 312.16 | 2022-04-03 13:16:18.362 [rank:3] [train], epoch: 46/50, iter: 700/834, loss: 0.23490, lr: 0.015095, top1: 0.78182, throughput: 312.02 | 2022-04-03 13:16:18.363 [rank:6] [train], epoch: 46/50, iter: 700/834, loss: 0.23537, lr: 0.015095, top1: 0.78250, throughput: 311.89 | 2022-04-03 13:16:18.377 [rank:6] [train], epoch: 46/50, iter: 800/834, loss: 0.23632, lr: 0.013974, top1: 0.77974, throughput: 313.30 | 2022-04-03 13:17:19.661 [rank:0] [train], epoch: 46/50, iter: 800/834, loss: 0.23600, lr: 0.013974, top1: 0.78250, throughput: 313.12 | 2022-04-03 13:17:19.665 [rank:3] [train], epoch: 46/50, iter: 800/834, loss: 0.23464, lr: 0.013974, top1: 0.78052, throughput: 313.17 | 2022-04-03 13:17:19.671 [rank:1] [train], epoch: 46/50, iter: 800/834, loss: 0.23770, lr: 0.013974, top1: 0.77802, throughput: 313.15 | 2022-04-03 13:17:19.674 [rank:7] [train], epoch: 46/50, iter: 800/834, loss: 0.23616, lr: 0.013974, top1: 0.77984, throughput: 312.92 | 2022-04-03 13:17:19.688 [rank:5] [train], epoch: 46/50, iter: 800/834, loss: 0.23359, lr: 0.013974, top1: 0.78318, throughput: 312.81 | 2022-04-03 13:17:19.709 [rank:4] [train], epoch: 46/50, iter: 800/834, loss: 0.23846, lr: 0.013974, top1: 0.77510, throughput: 312.86 | 2022-04-03 13:17:19.731 [rank:2] [train], epoch: 46/50, iter: 800/834, loss: 0.23441, lr: 0.013974, top1: 0.78297, throughput: 312.76 | 2022-04-03 13:17:19.735 [rank:6] [train], epoch: 46/50, iter: 834/834, loss: 0.23735, lr: 0.013603, top1: 0.77681, throughput: 314.52 | 2022-04-03 13:17:40.417 [rank:3] [train], epoch: 46/50, iter: 834/834, loss: 0.23573, lr: 0.013603, top1: 0.77114, throughput: 314.60 | 2022-04-03 13:17:40.422 [rank:2] [train], epoch: 46/50, iter: 834/834, loss: 0.23533, lr: 0.013603, top1: 0.78202, throughput: 315.55 | 2022-04-03 13:17:40.423 [rank:7] [train], epoch: 46/50, iter: 834/834, loss: 0.23568, lr: 0.013603, top1: 0.77849, throughput: 314.82 | 2022-04-03 13:17:40.424 [rank:1] [train], epoch: 46/50, iter: 834/834, loss: 0.23991, lr: 0.013603, top1: 0.76976, throughput: 314.60 | 2022-04-03 13:17:40.424 [rank:5] [train], epoch: 46/50, iter: 834/834, loss: 0.23784, lr: 0.013603, top1: 0.77696, throughput: 314.99 | 2022-04-03 13:17:40.433 [rank:4] [train], epoch: 46/50, iter: 834/834, loss: 0.23961, lr: 0.013603, top1: 0.77282, throughput: 315.15 | 2022-04-03 13:17:40.445 [rank:0] [train], epoch: 46/50, iter: 834/834, loss: 0.23335, lr: 0.013603, top1: 0.78217, throughput: 314.18 | 2022-04-03 13:17:40.443 [rank:0] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76240, throughput: 495.51 | 2022-04-03 13:17:53.056 [rank:2] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.75680, throughput: 494.63 | 2022-04-03 13:17:53.058 [rank:1] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76464, throughput: 494.69 | 2022-04-03 13:17:53.059 [rank:3] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.75920, throughput: 494.41 | 2022-04-03 13:17:53.063 [rank:4] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.75952, throughput: 494.75 | 2022-04-03 13:17:53.077 [rank:7] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76560, throughput: 493.85 | 2022-04-03 13:17:53.079 [rank:5] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.74960, throughput: 493.93 | 2022-04-03 13:17:53.087 [rank:6] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76512, throughput: 492.09 | 2022-04-03 13:17:53.118 [rank:3] [train], epoch: 47/50, iter: 100/834, loss: 0.23602, lr: 0.012541, top1: 0.77797, throughput: 311.45 | 2022-04-03 13:18:54.709 [rank:6] [train], epoch: 47/50, iter: 100/834, loss: 0.23602, lr: 0.012541, top1: 0.78109, throughput: 311.64 | 2022-04-03 13:18:54.727 [rank:1] [train], epoch: 47/50, iter: 100/834, loss: 0.23477, lr: 0.012541, top1: 0.78281, throughput: 311.22 | 2022-04-03 13:18:54.751 [rank:0] [train], epoch: 47/50, iter: 100/834, loss: 0.23503, lr: 0.012541, top1: 0.78010, throughput: 311.19 | 2022-04-03 13:18:54.755 [rank:2] [train], epoch: 47/50, iter: 100/834, loss: 0.23458, lr: 0.012541, top1: 0.78479, throughput: 311.12 | 2022-04-03 13:18:54.771 [rank:5] [train], epoch: 47/50, iter: 100/834, loss: 0.23343, lr: 0.012541, top1: 0.78672, throughput: 311.25 | 2022-04-03 13:18:54.773 [rank:4] [train], epoch: 47/50, iter: 100/834, loss: 0.23465, lr: 0.012541, top1: 0.78281, throughput: 311.12 | 2022-04-03 13:18:54.789 [rank:7] [train], epoch: 47/50, iter: 100/834, loss: 0.23410, lr: 0.012541, top1: 0.78318, throughput: 311.10 | 2022-04-03 13:18:54.796 [rank:7] [train], epoch: 47/50, iter: 200/834, loss: 0.23609, lr: 0.011521, top1: 0.78078, throughput: 311.48 | 2022-04-03 13:19:56.438 [rank:1] [train], epoch: 47/50, iter: 200/834, loss: 0.23381, lr: 0.011521, top1: 0.78448, throughput: 311.24 | 2022-04-03 13:19:56.440 [rank:5] [train], epoch: 47/50, iter: 200/834, loss: 0.23513, lr: 0.011521, top1: 0.78318, throughput: 311.34 | 2022-04-03 13:19:56.442 [rank:6] [train], epoch: 47/50, iter: 200/834, loss: 0.23373, lr: 0.011521, top1: 0.78833, throughput: 311.10 | 2022-04-03 13:19:56.444 [rank:4] [train], epoch: 47/50, iter: 200/834, loss: 0.23423, lr: 0.011521, top1: 0.78573, throughput: 311.42 | 2022-04-03 13:19:56.442 [rank:3] [train], epoch: 47/50, iter: 200/834, loss: 0.23481, lr: 0.011521, top1: 0.78370, throughput: 310.92 | 2022-04-03 13:19:56.462 [rank:2] [train], epoch: 47/50, iter: 200/834, loss: 0.23381, lr: 0.011521, top1: 0.78792, throughput: 311.21 | 2022-04-03 13:19:56.466 [rank:0] [train], epoch: 47/50, iter: 200/834, loss: 0.23266, lr: 0.011521, top1: 0.78719, throughput: 311.36 | 2022-04-03 13:19:56.419 [rank:1] [train], epoch: 47/50, iter: 300/834, loss: 0.23499, lr: 0.010544, top1: 0.78401, throughput: 312.38 | 2022-04-03 13:20:57.903 [rank:2] [train], epoch: 47/50, iter: 300/834, loss: 0.23332, lr: 0.010544, top1: 0.78505, throughput: 312.27 | 2022-04-03 13:20:57.950 [rank:7] [train], epoch: 47/50, iter: 300/834, loss: 0.23562, lr: 0.010544, top1: 0.77865, throughput: 312.09 | 2022-04-03 13:20:57.959 [rank:0] [train], epoch: 47/50, iter: 300/834, loss: 0.23578, lr: 0.010544, top1: 0.77990, throughput: 311.98 | 2022-04-03 13:20:57.962 [rank:4] [train], epoch: 47/50, iter: 300/834, loss: 0.23449, lr: 0.010544, top1: 0.78557, throughput: 311.96 | 2022-04-03 13:20:57.989 [rank:6] [train], epoch: 47/50, iter: 300/834, loss: 0.23446, lr: 0.010544, top1: 0.78380, throughput: 311.96 | 2022-04-03 13:20:57.991 [rank:3] [train], epoch: 47/50, iter: 300/834, loss: 0.23352, lr: 0.010544, top1: 0.78333, throughput: 312.02 | 2022-04-03 13:20:57.995 [rank:5] [train], epoch: 47/50, iter: 300/834, loss: 0.23473, lr: 0.010544, top1: 0.78250, throughput: 311.92 | 2022-04-03 13:20:57.996 [rank:0] [train], epoch: 47/50, iter: 400/834, loss: 0.23371, lr: 0.009610, top1: 0.78615, throughput: 311.67 | 2022-04-03 13:21:59.566 [rank:5] [train], epoch: 47/50, iter: 400/834, loss: 0.23254, lr: 0.009610, top1: 0.78552, throughput: 311.80 | 2022-04-03 13:21:59.575 [rank:2] [train], epoch: 47/50, iter: 400/834, loss: 0.23500, lr: 0.009610, top1: 0.78130, throughput: 311.56 | 2022-04-03 13:21:59.575 [rank:1] [train], epoch: 47/50, iter: 400/834, loss: 0.23333, lr: 0.009610, top1: 0.78589, throughput: 311.31 | 2022-04-03 13:21:59.579 [rank:3] [train], epoch: 47/50, iter: 400/834, loss: 0.23420, lr: 0.009610, top1: 0.78474, throughput: 311.68 | 2022-04-03 13:21:59.596 [rank:7] [train], epoch: 47/50, iter: 400/834, loss: 0.23385, lr: 0.009610, top1: 0.78208, throughput: 311.45 | 2022-04-03 13:21:59.606 [rank:4] [train], epoch: 47/50, iter: 400/834, loss: 0.23270, lr: 0.009610, top1: 0.78589, throughput: 311.60 | 2022-04-03 13:21:59.606 [rank:6] [train], epoch: 47/50, iter: 400/834, loss: 0.23442, lr: 0.009610, top1: 0.78062, throughput: 311.55 | 2022-04-03 13:21:59.619 [rank:5] [train], epoch: 47/50, iter: 500/834, loss: 0.23135, lr: 0.008719, top1: 0.79026, throughput: 313.34 | 2022-04-03 13:23:00.851 [rank:0] [train], epoch: 47/50, iter: 500/834, loss: 0.23486, lr: 0.008719, top1: 0.78172, throughput: 313.24 | 2022-04-03 13:23:00.861 [rank:6] [train], epoch: 47/50, iter: 500/834, loss: 0.23334, lr: 0.008719, top1: 0.78500, throughput: 313.36 | 2022-04-03 13:23:00.890 [rank:3] [train], epoch: 47/50, iter: 500/834, loss: 0.23554, lr: 0.008719, top1: 0.77995, throughput: 313.21 | 2022-04-03 13:23:00.898 [rank:7] [train], epoch: 47/50, iter: 500/834, loss: 0.23399, lr: 0.008719, top1: 0.78448, throughput: 313.24 | 2022-04-03 13:23:00.901 [rank:4] [train], epoch: 47/50, iter: 500/834, loss: 0.23382, lr: 0.008719, top1: 0.78448, throughput: 313.24 | 2022-04-03 13:23:00.901 [rank:2] [train], epoch: 47/50, iter: 500/834, loss: 0.23571, lr: 0.008719, top1: 0.78172, throughput: 312.92 | 2022-04-03 13:23:00.933 [rank:1] [train], epoch: 47/50, iter: 500/834, loss: 0.23324, lr: 0.008719, top1: 0.78531, throughput: 313.36 | 2022-04-03 13:23:00.850 [rank:3] [train], epoch: 47/50, iter: 600/834, loss: 0.23368, lr: 0.007871, top1: 0.78344, throughput: 313.98 | 2022-04-03 13:24:02.049 [rank:0] [train], epoch: 47/50, iter: 600/834, loss: 0.23379, lr: 0.007871, top1: 0.78635, throughput: 313.76 | 2022-04-03 13:24:02.054 [rank:2] [train], epoch: 47/50, iter: 600/834, loss: 0.23448, lr: 0.007871, top1: 0.78562, throughput: 314.08 | 2022-04-03 13:24:02.063 [rank:6] [train], epoch: 47/50, iter: 600/834, loss: 0.23258, lr: 0.007871, top1: 0.78740, throughput: 313.86 | 2022-04-03 13:24:02.064 [rank:7] [train], epoch: 47/50, iter: 600/834, loss: 0.23565, lr: 0.007871, top1: 0.77672, throughput: 313.74 | 2022-04-03 13:24:02.098 [rank:4] [train], epoch: 47/50, iter: 600/834, loss: 0.23472, lr: 0.007871, top1: 0.78469, throughput: 313.68 | 2022-04-03 13:24:02.110 [rank:5] [train], epoch: 47/50, iter: 600/834, loss: 0.23448, lr: 0.007871, top1: 0.78380, throughput: 313.41 | 2022-04-03 13:24:02.113 [rank:1] [train], epoch: 47/50, iter: 600/834, loss: 0.23422, lr: 0.007871, top1: 0.78203, throughput: 313.37 | 2022-04-03 13:24:02.121 [rank:7] [train], epoch: 47/50, iter: 700/834, loss: 0.23204, lr: 0.007066, top1: 0.78703, throughput: 314.39 | 2022-04-03 13:25:03.169 [rank:1] [train], epoch: 47/50, iter: 700/834, loss: 0.23444, lr: 0.007066, top1: 0.78260, throughput: 314.29 | 2022-04-03 13:25:03.210 [rank:5] [train], epoch: 47/50, iter: 700/834, loss: 0.23550, lr: 0.007066, top1: 0.78266, throughput: 314.22 | 2022-04-03 13:25:03.216 [rank:6] [train], epoch: 47/50, iter: 700/834, loss: 0.23233, lr: 0.007066, top1: 0.78781, throughput: 313.96 | 2022-04-03 13:25:03.219 [rank:2] [train], epoch: 47/50, iter: 700/834, loss: 0.23371, lr: 0.007066, top1: 0.78630, throughput: 313.94 | 2022-04-03 13:25:03.222 [rank:0] [train], epoch: 47/50, iter: 700/834, loss: 0.23494, lr: 0.007066, top1: 0.77990, throughput: 313.78 | 2022-04-03 13:25:03.244 [rank:4] [train], epoch: 47/50, iter: 700/834, loss: 0.23143, lr: 0.007066, top1: 0.79078, throughput: 313.99 | 2022-04-03 13:25:03.258 [rank:3] [train], epoch: 47/50, iter: 700/834, loss: 0.23220, lr: 0.007066, top1: 0.78948, throughput: 314.03 | 2022-04-03 13:25:03.191 [rank:0] [train], epoch: 47/50, iter: 800/834, loss: 0.23361, lr: 0.006305, top1: 0.78260, throughput: 312.88 | 2022-04-03 13:26:04.610 [rank:2] [train], epoch: 47/50, iter: 800/834, loss: 0.23329, lr: 0.006305, top1: 0.78589, throughput: 312.60 | 2022-04-03 13:26:04.642 [rank:3] [train], epoch: 47/50, iter: 800/834, loss: 0.23571, lr: 0.006305, top1: 0.77964, throughput: 312.40 | 2022-04-03 13:26:04.651 [rank:5] [train], epoch: 47/50, iter: 800/834, loss: 0.23272, lr: 0.006305, top1: 0.78479, throughput: 312.52 | 2022-04-03 13:26:04.651 [rank:6] [train], epoch: 47/50, iter: 800/834, loss: 0.23160, lr: 0.006305, top1: 0.78479, throughput: 312.44 | 2022-04-03 13:26:04.671 [rank:4] [train], epoch: 47/50, iter: 800/834, loss: 0.23286, lr: 0.006305, top1: 0.78500, throughput: 312.83 | 2022-04-03 13:26:04.634 [rank:7] [train], epoch: 47/50, iter: 800/834, loss: 0.23774, lr: 0.006305, top1: 0.77401, throughput: 312.33 | 2022-04-03 13:26:04.642 [rank:1] [train], epoch: 47/50, iter: 800/834, loss: 0.23311, lr: 0.006305, top1: 0.78620, throughput: 312.07 | 2022-04-03 13:26:04.736 [rank:5] [train], epoch: 47/50, iter: 834/834, loss: 0.23421, lr: 0.006056, top1: 0.78339, throughput: 312.75 | 2022-04-03 13:26:25.525 [rank:0] [train], epoch: 47/50, iter: 834/834, loss: 0.23623, lr: 0.006056, top1: 0.77972, throughput: 312.00 | 2022-04-03 13:26:25.533 [rank:6] [train], epoch: 47/50, iter: 834/834, loss: 0.23578, lr: 0.006056, top1: 0.78033, throughput: 312.85 | 2022-04-03 13:26:25.537 [rank:2] [train], epoch: 47/50, iter: 834/834, loss: 0.23429, lr: 0.006056, top1: 0.78768, throughput: 312.37 | 2022-04-03 13:26:25.540 [rank:1] [train], epoch: 47/50, iter: 834/834, loss: 0.23576, lr: 0.006056, top1: 0.78248, throughput: 313.78 | 2022-04-03 13:26:25.540 [rank:3] [train], epoch: 47/50, iter: 834/834, loss: 0.23414, lr: 0.006056, top1: 0.78753, throughput: 312.51 | 2022-04-03 13:26:25.539 [rank:7] [train], epoch: 47/50, iter: 834/834, loss: 0.23301, lr: 0.006056, top1: 0.78554, throughput: 312.31 | 2022-04-03 13:26:25.544 [rank:4] [train], epoch: 47/50, iter: 834/834, loss: 0.23242, lr: 0.006056, top1: 0.78845, throughput: 312.01 | 2022-04-03 13:26:25.556 [rank:0] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76112, throughput: 491.24 | 2022-04-03 13:26:38.256 [rank:3] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.75856, throughput: 491.31 | 2022-04-03 13:26:38.260 [rank:4] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76368, throughput: 491.66 | 2022-04-03 13:26:38.268 [rank:7] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76736, throughput: 490.44 | 2022-04-03 13:26:38.288 [rank:2] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.75568, throughput: 489.85 | 2022-04-03 13:26:38.299 [rank:5] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.74944, throughput: 488.34 | 2022-04-03 13:26:38.323 [rank:1] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76560, throughput: 487.91 | 2022-04-03 13:26:38.350 [rank:6] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76432, throughput: 486.91 | 2022-04-03 13:26:38.373 [rank:3] [train], epoch: 48/50, iter: 100/834, loss: 0.23350, lr: 0.005352, top1: 0.78839, throughput: 312.80 | 2022-04-03 13:27:39.641 [rank:4] [train], epoch: 48/50, iter: 100/834, loss: 0.23275, lr: 0.005352, top1: 0.78734, throughput: 312.78 | 2022-04-03 13:27:39.653 [rank:7] [train], epoch: 48/50, iter: 100/834, loss: 0.23352, lr: 0.005352, top1: 0.78698, throughput: 312.87 | 2022-04-03 13:27:39.655 [rank:6] [train], epoch: 48/50, iter: 100/834, loss: 0.23473, lr: 0.005352, top1: 0.78365, throughput: 313.27 | 2022-04-03 13:27:39.662 [rank:1] [train], epoch: 48/50, iter: 100/834, loss: 0.23355, lr: 0.005352, top1: 0.78385, throughput: 313.14 | 2022-04-03 13:27:39.664 [rank:2] [train], epoch: 48/50, iter: 100/834, loss: 0.23404, lr: 0.005352, top1: 0.78104, throughput: 312.72 | 2022-04-03 13:27:39.695 [rank:5] [train], epoch: 48/50, iter: 100/834, loss: 0.23395, lr: 0.005352, top1: 0.78521, throughput: 312.78 | 2022-04-03 13:27:39.708 [rank:0] [train], epoch: 48/50, iter: 100/834, loss: 0.23249, lr: 0.005352, top1: 0.78573, throughput: 312.34 | 2022-04-03 13:27:39.727 [rank:6] [train], epoch: 48/50, iter: 200/834, loss: 0.23319, lr: 0.004692, top1: 0.78667, throughput: 311.77 | 2022-04-03 13:28:41.246 [rank:4] [train], epoch: 48/50, iter: 200/834, loss: 0.23277, lr: 0.004692, top1: 0.78885, throughput: 311.72 | 2022-04-03 13:28:41.246 [rank:5] [train], epoch: 48/50, iter: 200/834, loss: 0.23054, lr: 0.004692, top1: 0.79266, throughput: 311.98 | 2022-04-03 13:28:41.251 [rank:0] [train], epoch: 48/50, iter: 200/834, loss: 0.23007, lr: 0.004692, top1: 0.79229, throughput: 312.01 | 2022-04-03 13:28:41.265 [rank:7] [train], epoch: 48/50, iter: 200/834, loss: 0.23203, lr: 0.004692, top1: 0.78813, throughput: 311.64 | 2022-04-03 13:28:41.265 [rank:2] [train], epoch: 48/50, iter: 200/834, loss: 0.23464, lr: 0.004692, top1: 0.78182, throughput: 311.77 | 2022-04-03 13:28:41.278 [rank:1] [train], epoch: 48/50, iter: 200/834, loss: 0.23358, lr: 0.004692, top1: 0.78198, throughput: 311.59 | 2022-04-03 13:28:41.284 [rank:3] [train], epoch: 48/50, iter: 200/834, loss: 0.23317, lr: 0.004692, top1: 0.79078, throughput: 311.36 | 2022-04-03 13:28:41.306 [rank:2] [train], epoch: 48/50, iter: 300/834, loss: 0.23203, lr: 0.004075, top1: 0.78536, throughput: 312.61 | 2022-04-03 13:29:42.696 [rank:1] [train], epoch: 48/50, iter: 300/834, loss: 0.23137, lr: 0.004075, top1: 0.78708, throughput: 312.54 | 2022-04-03 13:29:42.717 [rank:7] [train], epoch: 48/50, iter: 300/834, loss: 0.23280, lr: 0.004075, top1: 0.78646, throughput: 312.38 | 2022-04-03 13:29:42.729 [rank:6] [train], epoch: 48/50, iter: 300/834, loss: 0.23283, lr: 0.004075, top1: 0.78557, throughput: 312.17 | 2022-04-03 13:29:42.751 [rank:5] [train], epoch: 48/50, iter: 300/834, loss: 0.23236, lr: 0.004075, top1: 0.78615, throughput: 312.19 | 2022-04-03 13:29:42.752 [rank:4] [train], epoch: 48/50, iter: 300/834, loss: 0.23525, lr: 0.004075, top1: 0.78224, throughput: 312.09 | 2022-04-03 13:29:42.766 [rank:3] [train], epoch: 48/50, iter: 300/834, loss: 0.23259, lr: 0.004075, top1: 0.78635, throughput: 312.37 | 2022-04-03 13:29:42.771 [rank:0] [train], epoch: 48/50, iter: 300/834, loss: 0.23046, lr: 0.004075, top1: 0.78917, throughput: 312.15 | 2022-04-03 13:29:42.772 [rank:7] [train], epoch: 48/50, iter: 400/834, loss: 0.23405, lr: 0.003502, top1: 0.78052, throughput: 313.76 | 2022-04-03 13:30:43.921 [rank:2] [train], epoch: 48/50, iter: 400/834, loss: 0.23278, lr: 0.003502, top1: 0.78703, throughput: 313.51 | 2022-04-03 13:30:43.937 [rank:0] [train], epoch: 48/50, iter: 400/834, loss: 0.23335, lr: 0.003502, top1: 0.78911, throughput: 313.85 | 2022-04-03 13:30:43.947 [rank:3] [train], epoch: 48/50, iter: 400/834, loss: 0.23173, lr: 0.003502, top1: 0.78854, throughput: 313.78 | 2022-04-03 13:30:43.961 [rank:5] [train], epoch: 48/50, iter: 400/834, loss: 0.23383, lr: 0.003502, top1: 0.78323, throughput: 313.63 | 2022-04-03 13:30:43.971 [rank:1] [train], epoch: 48/50, iter: 400/834, loss: 0.23069, lr: 0.003502, top1: 0.79010, throughput: 313.42 | 2022-04-03 13:30:43.976 [rank:6] [train], epoch: 48/50, iter: 400/834, loss: 0.23099, lr: 0.003502, top1: 0.79000, throughput: 313.58 | 2022-04-03 13:30:43.979 [rank:4] [train], epoch: 48/50, iter: 400/834, loss: 0.23419, lr: 0.003502, top1: 0.78432, throughput: 313.46 | 2022-04-03 13:30:44.017 [rank:3] [train], epoch: 48/50, iter: 500/834, loss: 0.23318, lr: 0.002971, top1: 0.78531, throughput: 313.73 | 2022-04-03 13:31:45.161 [rank:6] [train], epoch: 48/50, iter: 500/834, loss: 0.23044, lr: 0.002971, top1: 0.78911, throughput: 313.80 | 2022-04-03 13:31:45.164 [rank:2] [train], epoch: 48/50, iter: 500/834, loss: 0.23350, lr: 0.002971, top1: 0.78526, throughput: 313.48 | 2022-04-03 13:31:45.185 [rank:7] [train], epoch: 48/50, iter: 500/834, loss: 0.23287, lr: 0.002971, top1: 0.78708, throughput: 313.29 | 2022-04-03 13:31:45.207 [rank:1] [train], epoch: 48/50, iter: 500/834, loss: 0.23383, lr: 0.002971, top1: 0.78479, throughput: 313.51 | 2022-04-03 13:31:45.218 [rank:0] [train], epoch: 48/50, iter: 500/834, loss: 0.23536, lr: 0.002971, top1: 0.78089, throughput: 313.31 | 2022-04-03 13:31:45.228 [rank:5] [train], epoch: 48/50, iter: 500/834, loss: 0.23362, lr: 0.002971, top1: 0.78677, throughput: 313.39 | 2022-04-03 13:31:45.237 [rank:4] [train], epoch: 48/50, iter: 500/834, loss: 0.23260, lr: 0.002971, top1: 0.78620, throughput: 313.57 | 2022-04-03 13:31:45.247 [rank:7] [train], epoch: 48/50, iter: 600/834, loss: 0.23236, lr: 0.002485, top1: 0.78844, throughput: 312.52 | 2022-04-03 13:32:46.644 [rank:2] [train], epoch: 48/50, iter: 600/834, loss: 0.23227, lr: 0.002485, top1: 0.78740, throughput: 312.19 | 2022-04-03 13:32:46.687 [rank:6] [train], epoch: 48/50, iter: 600/834, loss: 0.23380, lr: 0.002485, top1: 0.78536, throughput: 312.02 | 2022-04-03 13:32:46.699 [rank:4] [train], epoch: 48/50, iter: 600/834, loss: 0.23169, lr: 0.002485, top1: 0.78938, throughput: 312.41 | 2022-04-03 13:32:46.705 [rank:3] [train], epoch: 48/50, iter: 600/834, loss: 0.23299, lr: 0.002485, top1: 0.78432, throughput: 311.88 | 2022-04-03 13:32:46.723 [rank:0] [train], epoch: 48/50, iter: 600/834, loss: 0.23235, lr: 0.002485, top1: 0.79083, throughput: 312.16 | 2022-04-03 13:32:46.734 [rank:5] [train], epoch: 48/50, iter: 600/834, loss: 0.23325, lr: 0.002485, top1: 0.78438, throughput: 312.10 | 2022-04-03 13:32:46.756 [rank:1] [train], epoch: 48/50, iter: 600/834, loss: 0.23337, lr: 0.002485, top1: 0.78594, throughput: 311.98 | 2022-04-03 13:32:46.760 [rank:2] [train], epoch: 48/50, iter: 700/834, loss: 0.23405, lr: 0.002041, top1: 0.78396, throughput: 313.26 | 2022-04-03 13:33:47.978 [rank:5] [train], epoch: 48/50, iter: 700/834, loss: 0.23294, lr: 0.002041, top1: 0.79036, throughput: 313.55 | 2022-04-03 13:33:47.990 [rank:7] [train], epoch: 48/50, iter: 700/834, loss: 0.23089, lr: 0.002041, top1: 0.79094, throughput: 312.92 | 2022-04-03 13:33:48.002 [rank:6] [train], epoch: 48/50, iter: 700/834, loss: 0.23171, lr: 0.002041, top1: 0.78906, throughput: 313.19 | 2022-04-03 13:33:48.003 [rank:1] [train], epoch: 48/50, iter: 700/834, loss: 0.23289, lr: 0.002041, top1: 0.78505, throughput: 313.45 | 2022-04-03 13:33:48.013 [rank:3] [train], epoch: 48/50, iter: 700/834, loss: 0.23340, lr: 0.002041, top1: 0.78599, throughput: 313.18 | 2022-04-03 13:33:48.029 [rank:4] [train], epoch: 48/50, iter: 700/834, loss: 0.23296, lr: 0.002041, top1: 0.78568, throughput: 313.03 | 2022-04-03 13:33:48.041 [rank:0] [train], epoch: 48/50, iter: 700/834, loss: 0.23285, lr: 0.002041, top1: 0.78703, throughput: 313.13 | 2022-04-03 13:33:48.050 [rank:2] [train], epoch: 48/50, iter: 800/834, loss: 0.23179, lr: 0.001642, top1: 0.78760, throughput: 311.37 | 2022-04-03 13:34:49.641 [rank:5] [train], epoch: 48/50, iter: 800/834, loss: 0.23298, lr: 0.001642, top1: 0.78698, throughput: 311.25 | 2022-04-03 13:34:49.676 [rank:0] [train], epoch: 48/50, iter: 800/834, loss: 0.23126, lr: 0.001642, top1: 0.78906, throughput: 311.51 | 2022-04-03 13:34:49.686 [rank:6] [train], epoch: 48/50, iter: 800/834, loss: 0.23121, lr: 0.001642, top1: 0.78802, throughput: 311.16 | 2022-04-03 13:34:49.707 [rank:1] [train], epoch: 48/50, iter: 800/834, loss: 0.23221, lr: 0.001642, top1: 0.78552, throughput: 311.17 | 2022-04-03 13:34:49.715 [rank:3] [train], epoch: 48/50, iter: 800/834, loss: 0.23193, lr: 0.001642, top1: 0.78880, throughput: 311.25 | 2022-04-03 13:34:49.716 [rank:7] [train], epoch: 48/50, iter: 800/834, loss: 0.22938, lr: 0.001642, top1: 0.79411, throughput: 311.10 | 2022-04-03 13:34:49.718 [rank:4] [train], epoch: 48/50, iter: 800/834, loss: 0.23145, lr: 0.001642, top1: 0.79042, throughput: 311.18 | 2022-04-03 13:34:49.741 [rank:2] [train], epoch: 48/50, iter: 834/834, loss: 0.23262, lr: 0.001515, top1: 0.78171, throughput: 312.09 | 2022-04-03 13:35:10.558 [rank:7] [train], epoch: 48/50, iter: 834/834, loss: 0.23426, lr: 0.001515, top1: 0.77895, throughput: 313.21 | 2022-04-03 13:35:10.560 [rank:3] [train], epoch: 48/50, iter: 834/834, loss: 0.23281, lr: 0.001515, top1: 0.78906, throughput: 313.10 | 2022-04-03 13:35:10.565 [rank:0] [train], epoch: 48/50, iter: 834/834, loss: 0.23161, lr: 0.001515, top1: 0.78339, throughput: 312.63 | 2022-04-03 13:35:10.567 [rank:5] [train], epoch: 48/50, iter: 834/834, loss: 0.23260, lr: 0.001515, top1: 0.78722, throughput: 312.48 | 2022-04-03 13:35:10.568 [rank:6] [train], epoch: 48/50, iter: 834/834, loss: 0.23155, lr: 0.001515, top1: 0.78998, throughput: 312.48 | 2022-04-03 13:35:10.598 [rank:4] [train], epoch: 48/50, iter: 834/834, loss: 0.23350, lr: 0.001515, top1: 0.78615, throughput: 312.80 | 2022-04-03 13:35:10.611 [rank:1] [train], epoch: 48/50, iter: 834/834, loss: 0.23088, lr: 0.001515, top1: 0.79274, throughput: 312.38 | 2022-04-03 13:35:10.612 [rank:0] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76624, throughput: 492.29 | 2022-04-03 13:35:23.263 [rank:7] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76768, throughput: 491.28 | 2022-04-03 13:35:23.282 [rank:3] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.75968, throughput: 491.37 | 2022-04-03 13:35:23.285 [rank:4] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76368, throughput: 493.13 | 2022-04-03 13:35:23.285 [rank:2] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.75472, throughput: 490.04 | 2022-04-03 13:35:23.312 [rank:5] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.75232, throughput: 490.38 | 2022-04-03 13:35:23.313 [rank:1] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76784, throughput: 491.29 | 2022-04-03 13:35:23.334 [rank:6] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76432, throughput: 488.95 | 2022-04-03 13:35:23.381 [rank:6] [train], epoch: 49/50, iter: 100/834, loss: 0.23273, lr: 0.001174, top1: 0.78911, throughput: 313.44 | 2022-04-03 13:36:24.637 [rank:1] [train], epoch: 49/50, iter: 100/834, loss: 0.23280, lr: 0.001174, top1: 0.79000, throughput: 312.99 | 2022-04-03 13:36:24.679 [rank:2] [train], epoch: 49/50, iter: 100/834, loss: 0.23167, lr: 0.001174, top1: 0.78786, throughput: 312.87 | 2022-04-03 13:36:24.680 [rank:3] [train], epoch: 49/50, iter: 100/834, loss: 0.23403, lr: 0.001174, top1: 0.78516, throughput: 312.73 | 2022-04-03 13:36:24.680 [rank:0] [train], epoch: 49/50, iter: 100/834, loss: 0.23212, lr: 0.001174, top1: 0.78870, throughput: 312.61 | 2022-04-03 13:36:24.680 [rank:7] [train], epoch: 49/50, iter: 100/834, loss: 0.23117, lr: 0.001174, top1: 0.79109, throughput: 312.68 | 2022-04-03 13:36:24.686 [rank:4] [train], epoch: 49/50, iter: 100/834, loss: 0.23177, lr: 0.001174, top1: 0.78792, throughput: 312.67 | 2022-04-03 13:36:24.692 [rank:5] [train], epoch: 49/50, iter: 100/834, loss: 0.23220, lr: 0.001174, top1: 0.79203, throughput: 312.78 | 2022-04-03 13:36:24.697 [rank:3] [train], epoch: 49/50, iter: 200/834, loss: 0.23268, lr: 0.000876, top1: 0.78891, throughput: 313.09 | 2022-04-03 13:37:26.005 [rank:7] [train], epoch: 49/50, iter: 200/834, loss: 0.23172, lr: 0.000876, top1: 0.78802, throughput: 313.02 | 2022-04-03 13:37:26.023 [rank:1] [train], epoch: 49/50, iter: 200/834, loss: 0.23291, lr: 0.000876, top1: 0.78766, throughput: 312.98 | 2022-04-03 13:37:26.024 [rank:4] [train], epoch: 49/50, iter: 200/834, loss: 0.23094, lr: 0.000876, top1: 0.78859, throughput: 312.89 | 2022-04-03 13:37:26.056 [rank:6] [train], epoch: 49/50, iter: 200/834, loss: 0.23146, lr: 0.000876, top1: 0.78750, throughput: 312.57 | 2022-04-03 13:37:26.062 [rank:0] [train], epoch: 49/50, iter: 200/834, loss: 0.23361, lr: 0.000876, top1: 0.78698, throughput: 312.78 | 2022-04-03 13:37:26.066 [rank:5] [train], epoch: 49/50, iter: 200/834, loss: 0.23044, lr: 0.000876, top1: 0.79099, throughput: 312.80 | 2022-04-03 13:37:26.078 [rank:2] [train], epoch: 49/50, iter: 200/834, loss: 0.23394, lr: 0.000876, top1: 0.78500, throughput: 312.57 | 2022-04-03 13:37:26.105 [rank:5] [train], epoch: 49/50, iter: 300/834, loss: 0.23112, lr: 0.000621, top1: 0.78646, throughput: 315.21 | 2022-04-03 13:38:26.990 [rank:4] [train], epoch: 49/50, iter: 300/834, loss: 0.23169, lr: 0.000621, top1: 0.79255, throughput: 315.07 | 2022-04-03 13:38:26.995 [rank:2] [train], epoch: 49/50, iter: 300/834, loss: 0.23178, lr: 0.000621, top1: 0.78453, throughput: 315.22 | 2022-04-03 13:38:27.014 [rank:1] [train], epoch: 49/50, iter: 300/834, loss: 0.23258, lr: 0.000621, top1: 0.78406, throughput: 314.76 | 2022-04-03 13:38:27.023 [rank:7] [train], epoch: 49/50, iter: 300/834, loss: 0.23238, lr: 0.000621, top1: 0.79146, throughput: 314.69 | 2022-04-03 13:38:27.035 [rank:6] [train], epoch: 49/50, iter: 300/834, loss: 0.23363, lr: 0.000621, top1: 0.78474, throughput: 314.87 | 2022-04-03 13:38:27.040 [rank:3] [train], epoch: 49/50, iter: 300/834, loss: 0.23167, lr: 0.000621, top1: 0.78729, throughput: 314.56 | 2022-04-03 13:38:27.043 [rank:0] [train], epoch: 49/50, iter: 300/834, loss: 0.23164, lr: 0.000621, top1: 0.79068, throughput: 315.22 | 2022-04-03 13:38:26.976 [rank:0] [train], epoch: 49/50, iter: 400/834, loss: 0.23175, lr: 0.000410, top1: 0.79036, throughput: 313.12 | 2022-04-03 13:39:28.294 [rank:1] [train], epoch: 49/50, iter: 400/834, loss: 0.23303, lr: 0.000410, top1: 0.78714, throughput: 313.33 | 2022-04-03 13:39:28.301 [rank:2] [train], epoch: 49/50, iter: 400/834, loss: 0.23123, lr: 0.000410, top1: 0.79167, throughput: 313.19 | 2022-04-03 13:39:28.319 [rank:5] [train], epoch: 49/50, iter: 400/834, loss: 0.23258, lr: 0.000410, top1: 0.78531, throughput: 313.06 | 2022-04-03 13:39:28.320 [rank:3] [train], epoch: 49/50, iter: 400/834, loss: 0.23314, lr: 0.000410, top1: 0.79010, throughput: 313.29 | 2022-04-03 13:39:28.329 [rank:6] [train], epoch: 49/50, iter: 400/834, loss: 0.23207, lr: 0.000410, top1: 0.78974, throughput: 313.23 | 2022-04-03 13:39:28.338 [rank:7] [train], epoch: 49/50, iter: 400/834, loss: 0.23227, lr: 0.000410, top1: 0.78609, throughput: 313.15 | 2022-04-03 13:39:28.347 [rank:4] [train], epoch: 49/50, iter: 400/834, loss: 0.23122, lr: 0.000410, top1: 0.79021, throughput: 312.91 | 2022-04-03 13:39:28.354 [rank:1] [train], epoch: 49/50, iter: 500/834, loss: 0.23236, lr: 0.000243, top1: 0.79266, throughput: 311.87 | 2022-04-03 13:40:29.865 [rank:7] [train], epoch: 49/50, iter: 500/834, loss: 0.23423, lr: 0.000243, top1: 0.78531, throughput: 312.00 | 2022-04-03 13:40:29.885 [rank:0] [train], epoch: 49/50, iter: 500/834, loss: 0.23144, lr: 0.000243, top1: 0.78911, throughput: 311.70 | 2022-04-03 13:40:29.892 [rank:2] [train], epoch: 49/50, iter: 500/834, loss: 0.23338, lr: 0.000243, top1: 0.78651, throughput: 311.75 | 2022-04-03 13:40:29.907 [rank:5] [train], epoch: 49/50, iter: 500/834, loss: 0.23144, lr: 0.000243, top1: 0.78974, throughput: 311.75 | 2022-04-03 13:40:29.907 [rank:3] [train], epoch: 49/50, iter: 500/834, loss: 0.23003, lr: 0.000243, top1: 0.79031, throughput: 311.79 | 2022-04-03 13:40:29.908 [rank:4] [train], epoch: 49/50, iter: 500/834, loss: 0.23349, lr: 0.000243, top1: 0.78505, throughput: 311.90 | 2022-04-03 13:40:29.913 [rank:6] [train], epoch: 49/50, iter: 500/834, loss: 0.23358, lr: 0.000243, top1: 0.78318, throughput: 311.79 | 2022-04-03 13:40:29.919 [rank:6] [train], epoch: 49/50, iter: 600/834, loss: 0.23497, lr: 0.000119, top1: 0.78234, throughput: 314.71 | 2022-04-03 13:41:30.926 [rank:2] [train], epoch: 49/50, iter: 600/834, loss: 0.23289, lr: 0.000119, top1: 0.78557, throughput: 314.59 | 2022-04-03 13:41:30.939 [rank:4] [train], epoch: 49/50, iter: 600/834, loss: 0.23216, lr: 0.000119, top1: 0.79000, throughput: 314.51 | 2022-04-03 13:41:30.960 [rank:0] [train], epoch: 49/50, iter: 600/834, loss: 0.23173, lr: 0.000119, top1: 0.79021, throughput: 314.39 | 2022-04-03 13:41:30.962 [rank:7] [train], epoch: 49/50, iter: 600/834, loss: 0.23364, lr: 0.000119, top1: 0.78557, throughput: 314.32 | 2022-04-03 13:41:30.969 [rank:3] [train], epoch: 49/50, iter: 600/834, loss: 0.23193, lr: 0.000119, top1: 0.78859, throughput: 314.36 | 2022-04-03 13:41:30.985 [rank:1] [train], epoch: 49/50, iter: 600/834, loss: 0.23275, lr: 0.000119, top1: 0.78745, throughput: 314.12 | 2022-04-03 13:41:30.989 [rank:5] [train], epoch: 49/50, iter: 600/834, loss: 0.23316, lr: 0.000119, top1: 0.78568, throughput: 314.31 | 2022-04-03 13:41:30.994 [rank:6] [train], epoch: 49/50, iter: 700/834, loss: 0.23222, lr: 0.000039, top1: 0.78854, throughput: 313.04 | 2022-04-03 13:42:32.260 [rank:7] [train], epoch: 49/50, iter: 700/834, loss: 0.23252, lr: 0.000039, top1: 0.78724, throughput: 313.23 | 2022-04-03 13:42:32.267 [rank:3] [train], epoch: 49/50, iter: 700/834, loss: 0.23253, lr: 0.000039, top1: 0.78583, throughput: 313.21 | 2022-04-03 13:42:32.287 [rank:0] [train], epoch: 49/50, iter: 700/834, loss: 0.23191, lr: 0.000039, top1: 0.79063, throughput: 313.08 | 2022-04-03 13:42:32.287 [rank:4] [train], epoch: 49/50, iter: 700/834, loss: 0.23265, lr: 0.000039, top1: 0.78885, throughput: 313.07 | 2022-04-03 13:42:32.288 [rank:5] [train], epoch: 49/50, iter: 700/834, loss: 0.23059, lr: 0.000039, top1: 0.79151, throughput: 313.20 | 2022-04-03 13:42:32.298 [rank:2] [train], epoch: 49/50, iter: 700/834, loss: 0.23179, lr: 0.000039, top1: 0.78932, throughput: 312.88 | 2022-04-03 13:42:32.304 [rank:1] [train], epoch: 49/50, iter: 700/834, loss: 0.23270, lr: 0.000039, top1: 0.78661, throughput: 313.08 | 2022-04-03 13:42:32.316 [rank:7] [train], epoch: 49/50, iter: 800/834, loss: 0.23270, lr: 0.000003, top1: 0.78542, throughput: 313.69 | 2022-04-03 13:43:33.474 [rank:1] [train], epoch: 49/50, iter: 800/834, loss: 0.23098, lr: 0.000003, top1: 0.79156, throughput: 313.92 | 2022-04-03 13:43:33.478 [rank:2] [train], epoch: 49/50, iter: 800/834, loss: 0.23222, lr: 0.000003, top1: 0.78797, throughput: 313.85 | 2022-04-03 13:43:33.480 [rank:3] [train], epoch: 49/50, iter: 800/834, loss: 0.23160, lr: 0.000003, top1: 0.78854, throughput: 313.76 | 2022-04-03 13:43:33.480 [rank:6] [train], epoch: 49/50, iter: 800/834, loss: 0.23351, lr: 0.000003, top1: 0.78552, throughput: 313.44 | 2022-04-03 13:43:33.515 [rank:5] [train], epoch: 49/50, iter: 800/834, loss: 0.23059, lr: 0.000003, top1: 0.78979, throughput: 313.64 | 2022-04-03 13:43:33.516 [rank:0] [train], epoch: 49/50, iter: 800/834, loss: 0.23058, lr: 0.000003, top1: 0.79219, throughput: 313.51 | 2022-04-03 13:43:33.530 [rank:4] [train], epoch: 49/50, iter: 800/834, loss: 0.23368, lr: 0.000003, top1: 0.78661, throughput: 313.84 | 2022-04-03 13:43:33.466 [rank:1] [train], epoch: 49/50, iter: 834/834, loss: 0.23281, lr: 0.000000, top1: 0.78339, throughput: 309.11 | 2022-04-03 13:43:54.597 [rank:2] [train], epoch: 49/50, iter: 834/834, loss: 0.22966, lr: 0.000000, top1: 0.79151, throughput: 309.13 | 2022-04-03 13:43:54.597 [rank:6] [train], epoch: 49/50, iter: 834/834, loss: 0.23188, lr: 0.000000, top1: 0.78860, throughput: 309.48 | 2022-04-03 13:43:54.608 [rank:3] [train], epoch: 49/50, iter: 834/834, loss: 0.23224, lr: 0.000000, top1: 0.79151, throughput: 308.90 | 2022-04-03 13:43:54.613 [rank:4] [train], epoch: 49/50, iter: 834/834, loss: 0.22867, lr: 0.000000, top1: 0.79550, throughput: 308.60 | 2022-04-03 13:43:54.619 [rank:5] [train], epoch: 49/50, iter: 834/834, loss: 0.23314, lr: 0.000000, top1: 0.79182, throughput: 309.30 | 2022-04-03 13:43:54.622 [rank:0] [train], epoch: 49/50, iter: 834/834, loss: 0.23603, lr: 0.000000, top1: 0.78110, throughput: 309.22 | 2022-04-03 13:43:54.641 [rank:7] [train], epoch: 49/50, iter: 834/834, loss: 0.23212, lr: 0.000000, top1: 0.78738, throughput: 308.34 | 2022-04-03 13:43:54.645 [rank:0] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76544, throughput: 488.35 | 2022-04-03 13:44:07.439 [rank:3] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.75936, throughput: 486.85 | 2022-04-03 13:44:07.451 [rank:7] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76768, throughput: 487.58 | 2022-04-03 13:44:07.464 [rank:4] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76336, throughput: 486.60 | 2022-04-03 13:44:07.464 [rank:1] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76944, throughput: 485.61 | 2022-04-03 13:44:07.467 [rank:2] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.75648, throughput: 484.47 | 2022-04-03 13:44:07.498 [rank:5] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.75456, throughput: 485.30 | 2022-04-03 13:44:07.500 [rank:6] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76448, throughput: 484.15 | 2022-04-03 13:44:07.518